Mock Version: 5.9 Mock Version: 5.9 Mock Version: 5.9 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'], chrootPath='/var/lib/mock/f42-build-55737982-6538420/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.ch_as3uk:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.ch_as3uk:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', '4db89a6cb0364804aec2945937739d77', '-D', '/var/lib/mock/f42-build-55737982-6538420/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.ch_as3uk:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1733788800 Wrote: /builddir/build/SRPMS/rccl-6.3.0-1.fc42.src.rpm Child return code was: 0 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'], chrootPath='/var/lib/mock/f42-build-55737982-6538420/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.ch_as3uk:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.ch_as3uk:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', '3644d22c50b44bf38063dfc7c0565cb0', '-D', '/var/lib/mock/f42-build-55737982-6538420/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.ch_as3uk:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1733788800 Executing(%mkbuilddir): /bin/sh -e /var/tmp/rpm-tmp.LLP9F1 + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + test -d /builddir/build/BUILD/rccl-6.3.0-build + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w /builddir/build/BUILD/rccl-6.3.0-build + /usr/bin/rm -rf /builddir/build/BUILD/rccl-6.3.0-build + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.3.0-build + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/SPECPARTS + RPM_EC=0 ++ jobs -p + exit 0 Executing(%prep): /bin/sh -e /var/tmp/rpm-tmp.jWcVGX + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + cd /builddir/build/BUILD/rccl-6.3.0-build + rm -rf rccl-rocm-6.3.0 + /usr/lib/rpm/rpmuncompress -x /builddir/build/SOURCES/RCCL-6.3.0.tar.gz + STATUS=0 + '[' 0 -ne 0 ']' + cd rccl-rocm-6.3.0 + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w . + sed -i -e '/AMD GPU targets to compile for/d' CMakeLists.txt + sed -i -e 's@cat ${ROCM_PATH}/.info/version@echo 6.3.0@' CMakeLists.txt + sed -i -e s@rocm-core/rocm_version.h@rocm_version.h@ src/include/hip_rocm_version_info.h + RPM_EC=0 ++ jobs -p + exit 0 Executing(%build): /bin/sh -e /var/tmp/rpm-tmp.dEb8Z7 + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd rccl-rocm-6.3.0 + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + /usr/bin/cmake -S . -B redhat-linux-build -DCMAKE_C_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_CXX_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_Fortran_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_VERBOSE_MAKEFILE:BOOL=ON -DCMAKE_INSTALL_DO_STRIP:BOOL=OFF -DCMAKE_INSTALL_PREFIX:PATH=/usr -DINCLUDE_INSTALL_DIR:PATH=/usr/include -DLIB_INSTALL_DIR:PATH=/usr/lib64 -DSYSCONF_INSTALL_DIR:PATH=/etc -DSHARE_INSTALL_PREFIX:PATH=/usr/share -DLIB_SUFFIX=64 -DBUILD_SHARED_LIBS:BOOL=ON -DBUILD_TESTS=OFF -DCMAKE_CXX_COMPILER=/usr/bin/hipcc -DCMAKE_C_COMPILER=/usr/bin/hipcc -DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_SKIP_RPATH=ON -DBUILD_FILE_REORG_BACKWARD_COMPATIBILITY=OFF -DCMAKE_INSTALL_LIBDIR=/usr/lib64 -DROCM_SYMLINK_LIBS=OFF -DAMDGPU_TARGETS=gfx1100 -DHIP_PLATFORM=amd -DRCCL_ROCPROFILER_REGISTER=OFF CMake Deprecation Warning at CMakeLists.txt:6 (cmake_minimum_required): Compatibility with CMake < 3.10 will be removed from a future version of CMake. Update the VERSION argument value. Or, use the ... syntax to tell CMake that the project requires at least but has been updated to work with policies introduced by or earlier. -- CMAKE_TOOLCHAIN_FILE: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/toolchain-linux.cmake -- The CXX compiler identification is Clang 18.0.0 -- Detecting CXX compiler ABI info -- Detecting CXX compiler ABI info - done -- Check for working CXX compiler: /usr/bin/hipcc - skipped -- Detecting CXX compile features -- Detecting CXX compile features - done -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- Checking for ROCm support for GPU targets: gfx1100 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 -- Performing Test COMPILER_HAS_TARGET_ID_gfx1100 - Success -- Compiling for gfx1100 -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- ROCM_PATH found: /opt/rocm -- Compiling with hipcc -- Performing Test CMAKE_HAVE_LIBC_PTHREAD -- Performing Test CMAKE_HAVE_LIBC_PTHREAD - Success -- Found Threads: TRUE -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS - Success -- HIP compiler: clang -- HIP runtime: rocclr -- hipcc executable: /usr/bin/hipcc sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory -- hipcc version: 6.3.42131 -- hipconfig executable: /usr/bin/hipconfig -- hipcc HIP version: 6.3.42131 -- ROCm version: 6.3.0 ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:87 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:191 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:88 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:191 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocUncached -- Looking for hipDeviceMallocUncached - found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:99 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:73 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:191 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:87 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:194 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:88 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:194 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocContiguous -- Looking for hipDeviceMallocContiguous - found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:99 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:73 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:194 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- RCCL LL128 protocol enabled -- HSA runtime: /usr/include -- Found rocm_smi at /usr/include -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h - found -- RSMI_INIT_FLAG_THRAD_ONLY_MUTEX supported -- Performing Test HAVE_KERNARG_PRELOAD -- Performing Test HAVE_KERNARG_PRELOAD - Success -- Kernarg preloading to SGPR enabled CMake Warning at CMakeLists.txt:301 (message): Can only build MSCCL++ for gfx942; disabling MSCCL++ build -- Found Python3: /usr/bin/python3.13 (found version "3.13.1") found components: Interpreter -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.h -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp -- Generating /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp -- HIP_CONTIGUOUS_MEMORY enabled -- HIP_UNCACHED_MEMORY enabled cat: /sys/fs/cgroup/memory/memory.limit_in_bytes: No such file or directory -- Use 8 jobs for linking -- Building shared RCCL library -- rocm-cmake: Set license file to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/LICENSE.txt. -- Configuring done (20.6s) -- Generating done (0.1s) CMake Warning: Manually-specified variables were not used by the project: CMAKE_CXX_FLAGS_RELEASE CMAKE_C_FLAGS_RELEASE CMAKE_Fortran_FLAGS_RELEASE CMAKE_INSTALL_DO_STRIP LIB_SUFFIX SHARE_INSTALL_PREFIX SYSCONF_INSTALL_DIR -- Build files have been written to: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build + /usr/bin/cmake --build redhat-linux-build -j48 --verbose Change Dir: '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' Run Build Command(s): /usr/bin/cmake -E env VERBOSE=1 /usr/bin/gmake -f Makefile -j48 /usr/bin/cmake -S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 -B/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build --check-build-system CMakeFiles/Makefile.cmake 0 /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build//CMakeFiles/progress.marks /usr/bin/gmake -f CMakeFiles/Makefile2 all gmake[1]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' cd /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles/git_version_check.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/git_version_check.dir/build.make CMakeFiles/git_version_check.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 0%] Updating git_version.cpp if necessary /usr/bin/cmake -P /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/git_version.cmake -- Updating git_version.cpp gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 0%] Built target git_version_check /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/depend gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 0%] Hipifying src/bootstrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc [ 1%] Hipifying src/transport/shm.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc [ 2%] Hipifying src/collectives.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/shm.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/bootstrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/collectives.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc [ 3%] Hipifying src/device/all_reduce.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h [ 3%] Hipifying src/channel.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc [ 3%] Hipifying src/device/all_gather.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h [ 3%] Hipifying src/device/onerank.cu -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/all_reduce.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h [ 3%] Hipifying src/debug.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/channel.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/all_gather.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/onerank.cu -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp [ 3%] Hipifying src/device/msccl_kernel_impl.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h [ 3%] Hipifying src/device/broadcast.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/debug.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/msccl_kernel_impl.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h [ 5%] Hipifying src/device/network/unpack/unpack_defs.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h [ 3%] Hipifying src/device/alltoall_pivot.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h [ 5%] Hipifying src/device/common_kernel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h [ 5%] Hipifying src/device/common.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h [ 5%] Hipifying src/device/reduce.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/broadcast.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h [ 5%] Hipifying src/device/common.cu -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/alltoall_pivot.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/common_kernel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/common.cu -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp [ 5%] Hipifying src/device/prims_ll128.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h [ 5%] Hipifying src/device/primitives.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/common.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/network/unpack/unpack_defs.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h [ 5%] Hipifying src/device/network/unpack/unpack.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/reduce.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h [ 6%] Hipifying src/device/prims_ll.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/primitives.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h [ 6%] Hipifying src/device/op128.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/prims_ll128.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/network/unpack/unpack.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h [ 7%] Hipifying src/device/reduce_scatter.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/op128.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/prims_ll.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h [ 7%] Hipifying src/enqueue.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc [ 7%] Hipifying src/device/reduce_kernel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h [ 7%] Hipifying src/device/prims_simple.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/reduce_scatter.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h [ 7%] Hipifying src/graph/rings.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.h [ 7%] Hipifying src/graph/paths.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc [ 7%] Hipifying src/device/sendrecv.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h [ 8%] Hipifying src/graph/rings.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc [ 9%] Hipifying src/graph/rome_models.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.h [ 9%] Hipifying src/graph/search.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc [ 9%] Hipifying src/graph/connect.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc [ 9%] Hipifying src/graph/rome_models.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/prims_simple.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h [ 9%] Hipifying src/graph/topo.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/reduce_kernel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h [ 9%] Hipifying src/graph/trees.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/device/sendrecv.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h [ 9%] Hipifying src/graph/topo.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/enqueue.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/connect.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/paths.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc [ 10%] Hipifying src/graph/tuning.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc [ 10%] Hipifying src/graph/xml.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rings.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rings.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rome_models.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc [ 10%] Hipifying src/graph/xml.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/rome_models.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/search.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc [ 11%] Hipifying src/include/alloc.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h [ 11%] Hipifying src/include/align.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/align.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/topo.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/topo.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h [ 11%] Hipifying src/group.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/trees.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/tuning.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc [ 11%] Hipifying src/include/BfdBacktrace.hpp -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/xml.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc [ 11%] Hipifying src/include/alt_rsmi.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alt_rsmi.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/graph/xml.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h [ 11%] Hipifying src/include/api_trace.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/api_trace.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/group.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc [ 11%] Hipifying src/include/archinfo.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/archinfo.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/BfdBacktrace.hpp -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/BfdBacktrace.hpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/align.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/align.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/align.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/alloc.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/alt_rsmi.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alt_rsmi.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alt_rsmi.h [ 12%] Hipifying src/include/argcheck.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/api_trace.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/api_trace.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/api_trace.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/archinfo.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/archinfo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/archinfo.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/argcheck.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h [ 12%] Hipifying src/include/bootstrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/bootstrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h [ 12%] Hipifying src/include/channel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/channel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h [ 13%] Hipifying src/include/checks.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/checks.h [ 13%] Hipifying src/include/coll_net.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/checks.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/checks.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/checks.h [ 13%] Hipifying src/include/collectives.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/collectives.h [ 13%] Hipifying src/include/comm.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/coll_net.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/collectives.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/collectives.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/collectives.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack_defs.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/comm.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h [ 14%] Hipifying src/include/core.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h [ 14%] Hipifying src/include/cpuset.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/cpuset.h [ 14%] Hipifying src/include/debug.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/debug.h [ 14%] Hipifying src/include/device.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/core.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/cpuset.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/cpuset.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/cpuset.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/debug.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/debug.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/debug.h [ 15%] Hipifying src/include/enqueue.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/device.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/enqueue.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h [ 15%] Hipifying src/include/gdrwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h [ 15%] Hipifying src/include/git_version.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/git_version.h [ 15%] Hipifying src/include/graph.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/gdrwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/git_version.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/git_version.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/git_version.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/graph.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h [ 16%] Hipifying src/include/group.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/group.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h [ 16%] Hipifying src/include/hip_rocm_version_info.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/hip_rocm_version_info.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/hip_rocm_version_info.h [ 16%] Hipifying src/include/ibvsymbols.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvsymbols.h [ 16%] Hipifying src/include/ibvcore.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvcore.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ibvsymbols.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvsymbols.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvsymbols.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ibvcore.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvcore.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvcore.h [ 17%] Hipifying src/include/ibvwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h [ 17%] Hipifying src/include/info.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ibvwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack/unpack.h [ 17%] Hipifying src/include/ipcsocket.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ipcsocket.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/info.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/ipcsocket.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ipcsocket.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ipcsocket.h [ 17%] Hipifying src/include/msccl/msccl_kernel.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h [ 17%] Hipifying src/include/msccl/msccl_lifecycle.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_kernel.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_kernel.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_lifecycle.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_lifecycle.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h [ 18%] Hipifying src/include/msccl/msccl_parser.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_parser.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h [ 18%] Hipifying src/include/msccl/msccl_scheduler.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_scheduler.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_scheduler.h [ 18%] Hipifying src/include/msccl/msccl_setup.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_setup.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_setup.h [ 18%] Hipifying src/include/msccl/msccl_status.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_status.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h [ 19%] Hipifying src/include/msccl/msccl_struct.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/msccl/msccl_struct.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h [ 19%] Hipifying src/include/nccl_common.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_common.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nccl_common.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_common.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_common.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h [ 20%] Hipifying src/include/nccl_tuner.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_tuner.h [ 20%] Hipifying src/include/nccl_net.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_net.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nccl_net.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_net.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/op128.h [ 20%] Hipifying src/include/net.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nccl_tuner.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_tuner.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nccl_tuner.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/net.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h [ 20%] Hipifying src/include/net_device.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net_device.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/net_device.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net_device.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net_device.h [ 20%] Hipifying src/include/npkit/npkit.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/npkit/npkit.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h [ 20%] Hipifying src/include/npkit/npkit_event.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_event.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/npkit/npkit_event.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_event.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_event.h [ 20%] Hipifying src/include/nvtx.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h [ 20%] Hipifying src/include/npkit/npkit_struct.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h [ 21%] Hipifying src/include/nvmlwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvmlwrap.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/npkit/npkit_struct.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit_struct.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvmlwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvmlwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvmlwrap.h [ 21%] Hipifying src/include/nvtx3/nvToolsExt.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_kernel.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtCuda.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExt.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExt.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtCuda.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCuda.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtCudaRt.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h [ 22%] Hipifying src/include/nvtx3/nvToolsExtOpenCL.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtCudaRt.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtCudaRt.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtOpenCL.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtOpenCL.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h Added COLL_UNROLL template argument to /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtPayload.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtPayload.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtPayload.h [ 23%] Hipifying src/include/nvtx3/nvToolsExtSync.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h [ 23%] Hipifying src/include/nvtx3/nvtx3.hpp -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp [ 23%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImpl.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvToolsExtSync.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvToolsExtSync.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImpl.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h [ 23%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCore.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtx3.hpp -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplCore.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h [ 24%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h [ 24%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h [ 24%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInit.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxInit.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h [ 25%] Hipifying src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h [ 26%] Hipifying src/include/nvtx3/nvtxDetail/nvtxTypes.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h [ 26%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxDetail/nvtxTypes.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h [ 26%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h [ 27%] Hipifying src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h [ 27%] Hipifying src/include/nvtx_stub.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx_stub.h [ 27%] Hipifying src/include/p2p.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/p2p.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/nvtx_stub.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx_stub.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx_stub.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/p2p.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/p2p.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/p2p.h [ 28%] Hipifying src/include/param.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/param.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/param.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/param.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/param.h [ 28%] Hipifying src/include/profiler.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h [ 28%] Hipifying src/include/proxy.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/profiler.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/proxy.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h [ 28%] Hipifying src/include/rccl_float8.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h [ 28%] Hipifying src/include/rccl_vars.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_vars.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rccl_float8.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rccl_vars.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_vars.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_vars.h [ 28%] Hipifying src/include/rocm_smi_wrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h [ 30%] Hipifying src/include/register.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/register.h [ 30%] Hipifying src/include/roctx.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h [ 30%] Hipifying src/include/rocmwrap.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocmwrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rocm_smi_wrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocm_smi_wrap.h [ 30%] Hipifying src/include/shm.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/shm.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/register.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/register.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/register.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/rocmwrap.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocmwrap.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rocmwrap.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/roctx.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/shm.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/shm.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/shm.h [ 30%] Hipifying src/include/signals.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/signals.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/signals.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/signals.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/signals.h [ 30%] Hipifying src/include/socket.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/socket.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/socket.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/socket.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/socket.h [ 31%] Hipifying src/include/strongstream.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/strongstream.h [ 31%] Hipifying src/include/timer.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/timer.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/strongstream.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/strongstream.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/strongstream.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/timer.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/timer.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/timer.h [ 31%] Hipifying src/include/transport.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/transport.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h [ 32%] Hipifying src/include/trees.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/trees.h [ 32%] Hipifying src/include/tuner.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/tuner.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/trees.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/trees.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/trees.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/tuner.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/tuner.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/tuner.h [ 32%] Hipifying src/include/utils.h -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h [ 33%] Hipifying src/init.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/include/utils.h -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/init.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc [ 33%] Hipifying src/init_nvtx.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/init_nvtx.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc [ 34%] Hipifying src/misc/alt_rsmi.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/alt_rsmi.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc [ 35%] Hipifying src/misc/api_trace.c -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.c [ 35%] Hipifying src/misc/api_trace.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/api_trace.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/api_trace.c -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.c && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.c [ 35%] Hipifying src/misc/archinfo.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/archinfo.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc [ 35%] Hipifying src/misc/argcheck.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/argcheck.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc [ 35%] Hipifying src/misc/ibvsymbols.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/ibvsymbols.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc [ 35%] Hipifying src/misc/ibvwrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/ibvwrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc [ 35%] Hipifying src/misc/ipcsocket.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc [ 35%] Hipifying src/misc/msccl/msccl_lifecycle.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/ipcsocket.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc [ 35%] Hipifying src/misc/msccl/msccl_parser.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_lifecycle.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_parser.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc [ 36%] Hipifying src/misc/msccl/msccl_setup.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_setup.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc [ 36%] Hipifying src/misc/msccl/msccl_status.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/msccl/msccl_status.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc [ 37%] Hipifying src/misc/npkit.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/npkit.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc [ 37%] Hipifying src/misc/nvmlwrap_stub.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/nvmlwrap_stub.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc [ 37%] Hipifying src/misc/param.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc [ 37%] Hipifying src/misc/profiler.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/profiler.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/param.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc [ 38%] Hipifying src/misc/rocm_smi_wrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/rocm_smi_wrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc [ 38%] Hipifying src/misc/rocmwrap.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc [ 39%] Hipifying src/misc/shmutils.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/rocmwrap.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc [ 39%] Hipifying src/misc/roctx.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/shmutils.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/roctx.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc [ 39%] Hipifying src/misc/signals.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/signals.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc [ 39%] Hipifying src/misc/strongstream.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc [ 39%] Hipifying src/misc/socket.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc [ 40%] Hipifying src/misc/tuner.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/strongstream.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/socket.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/tuner.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc [ 40%] Hipifying src/misc/utils.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/misc/utils.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc [ 40%] Hipifying src/msccl.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc [ 40%] Hipifying src/net.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc [ 40%] Hipifying src/register.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc [ 41%] Hipifying src/proxy.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/msccl.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc [ 41%] Hipifying src/transport.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc [ 41%] Hipifying src/transport/coll_net.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/net.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/proxy.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc [ 42%] Hipifying src/transport/net_ib.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/register.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/coll_net.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/net_ib.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc [ 42%] Hipifying src/transport/net_socket.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc [ 42%] Hipifying src/transport/net.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc [ 42%] Hipifying src/transport/p2p.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/net_socket.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc [ 42%] Hipifying src/transport/nvls.cc -> /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/net.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/p2p.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/src/transport/nvls.cc -o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc && /usr/bin/cmake -E env bash /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/cmake/scripts/add_unroll.sh /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc cd /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build && /usr/bin/cmake -E cmake_depends "Unix Makefiles" /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles/rccl.dir/DependInfo.cmake "--color=" gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/gmake -f CMakeFiles/rccl.dir/build.make CMakeFiles/rccl.dir/build gmake[2]: Entering directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/debug.cc.o [ 42%] Building CXX object CMakeFiles/rccl.dir/hipify/src/collectives.cc.o [ 43%] Building CXX object CMakeFiles/rccl.dir/hipify/src/group.cc.o [ 43%] Building CXX object CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/net.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/channel.cc.o [ 44%] Building CXX object CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/debug.cc.o -MF CMakeFiles/rccl.dir/hipify/src/debug.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/debug.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/group.cc.o -MF CMakeFiles/rccl.dir/hipify/src/group.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/group.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/channel.cc.o -MF CMakeFiles/rccl.dir/hipify/src/channel.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/channel.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -MF CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc [ 45%] Building CXX object CMakeFiles/rccl.dir/hipify/src/init.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/net.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/msccl.cc.o [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/register.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/init.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -MF CMakeFiles/rccl.dir/hipify/src/msccl.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/register.cc.o -MF CMakeFiles/rccl.dir/hipify/src/register.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/register.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/proxy.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o [ 46%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -MF CMakeFiles/rccl.dir/hipify/src/proxy.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o [ 47%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o [ 48%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc [ 49%] Building CXX object CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o [ 50%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/trees.cc [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/archinfo.cc [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc [ 51%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/nvmlwrap_stub.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/param.cc [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocmwrap.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o [ 52%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/signals.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/strongstream.cc [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc [ 53%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/tuner.cc [ 54%] Building CXX object CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | statIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ic float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 30 warnings generated when compiling for gfx1100. 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: = system->nodes[GPwarning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ U].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].17 warnings generated when compiling for gfx1100. count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ct ncclTopoSystem* system, int64_t id, iIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ nt* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 1 warning generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} 1 warning generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntry_t /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ AllToAllSchema[] = { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] uint32_t y, head, mantissa; | ^ 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ 2 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constex/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.ccp:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ r nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 255 | Nvt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:104:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 104 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! xParamsReduce payload{count * /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:102:13: warning: unused variable 'ret_domain' [-Wunused-variable] 102 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), pe[ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o er}; | ^~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:69:14: warning: unused variable 'count' [-Wunused-variable] 69 | uint32_t count = 0; | ^~~~~ 49 warnings generated when compiling for gfx1100. 4 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static nccIn file included from l/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | statiResult_tc ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, ncclTopstruct kvDict* dict) { | ^~~~~~~~~~~~~~ oIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 55%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. 1 warning generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for host. 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:22:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 22 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:25:10: warning: unused variable 'msgsize' [-Wunused-variable] 25 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:52:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 52 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:57:23: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:272:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 272 | int intermediateIndex = -1; | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:80:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 80 | constexpr nvtxPayloadSchemaEntIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:83:10: warning: unused variable 'msgsize' [-Wunused-variable] 83 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:128:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 128 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:132:23: warning: unused variable 'payload' [-Wunused-variable] 132 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), rIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ cvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:173:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 173 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:177:23: warning: unused variable 'payload' [-Wunused-variable] 177 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:210:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 210 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:214:22: warning: unused variable 'payload' [-Wunused-variable] 214 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTop31 warnings generated when compiling for host. oRankToInde/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:249:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 249 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:255:20: warning: unused variable 'payload' [-Wunused-variable] 255 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ x(struct ncclTopoSystem* system/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:281:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 281 | conste2 warnings generated when compiling for host. xpr nvtxPayloadSchemaEntry_t ReduceScat/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:459:24: warning: unused variable 'gpu' [-Wunused-variable] 459 | struct ncclTopoNode* gpu = system->nodes[GPU].n,o dienst+ gr;a n k| , ^~~ int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:261:21: warning: unused function 'getIndexes' [-Wunused-function] 261 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:435:21: warning: unused function 'connectNvls' [-Wunused-function] 435 | static ncclResult_t connectNvls(struct ncclComm* comm, int* nvlsHeads, int nHeads) { | ^~~~~~~~~~~ terSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:286:27: warning: unused variable 'payload' [-Wunused-variable] 286 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype1 warning generated when compiling for gfx1100. ), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:312:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 312 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:316:23: warning: unused variable 'payload' [-Wunused-variable] 316 | [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:381:22: warning: unused variable 'payload' [-Wunused-variable] 381 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/search.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ [ 56%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cct:1044:7: warning: unused variable 'nChannels' [-Wunused-variable] 1044 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1054:12: warning: unused variable 'y' [-Wunused-variable] 1054 | int x=0, y=0; | ^ atic const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem*2 warnings generated when compiling for gfx1100. system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/collectives.cc:345:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 345 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp [ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1563 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1563:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1538:7: note: declared here 1538 | int ngpus = system->nodes[GPU].count; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* systIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ m, int dev,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1535:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1535 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1554:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1554 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1625:9: warning: unused variable 't' [-Wunused-variable] 1625 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.ccv:_338us:e10c: - warning: tunused variable 'llMaxBw' [-Wunused-variable]v s.tv_use c338) | / 1 Ed3o;u b l| e ^ llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int*[ 57%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXmIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ l* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* pr2 warnings generated when compiling for host. ev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetA/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1712:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1712 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1716:7: warning: unused variable 'ncpus' [-Wunused-variable] 1716 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1809:9: warning: unused variable 't' [-Wunused-variable] 1809 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ ttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1892:11: warning: 'NUMA_CPUS' macro redefined [-Wmacro-redefined] 1892 | #define NUMA_CPUS 4 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1530:11: note: previous definition is here 1530 | #define NUMA_CPUS 2 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1895:11: warning: 'TOTAL_PERMUTE_COUNT' macro redefined [-Wmacro-redefined] 1895 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1533:11: note: previous definition is here 1533 | #define TOTAL_PERMUTE_COUNT (NUMA_PERMUTE_COUNT*NUMA_PERMUTE_COUNT) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1927 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1927:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1900:7: note: declared here 1900 | int ngpus = system->nodes[GPU].count; | ^ [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1897:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1897 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1918:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1918 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:1993:9: warning: unused variable 't' [-Wunused-variable] 1993 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ 2 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:338:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 338 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 339 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 340 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 341 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:344:9: warning: unused variable 'ppn' [-Wunused-variable] 344 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2034:7: note: declared here 2034 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 2051 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2051:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2035:7: note: declared here 2035 | int nnets = system->nodes[NET].count; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:2032:15: warning: unused variable 'ringRemap' [-Wunused-variable] 2032 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:51:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 51 | static const char *kPathDRMRoot = "/sys/claIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ss/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/alt_rsmi.cc:558:13: warning: unused function 'fileExists' [-Wunused-function] 558 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 2In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncc6 warnings generated when compiling for gfx1100. lResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/tuning.cc:626:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 626 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 1 warning generated when compiling for host. 31 warnings generated when compiling for gfx1100. 3 warnings generated when compiling for host. 15 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ 2 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ 3 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 2 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:120:12: warning: unused variable 'y' [-Wunused-variable] 120 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:127:7: warning: unused variable 'localRanks' [-Wunused-variable] 127 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o [ 58%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; }21 :| ^~~~~~~~~~~~~warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 222 | static ncclResu l29t | _stta tniccc lnTcocploRReasnuklTto_Itn dceoxl(lsNtertuTcets t(nsctcrluTcotp onScycsltCeomm*m *s ycsotmme,m ,v oiindt* rraenqku,e sitn,t *i nitn*d edxo)n e{, i| n ^~~~~~~~~~~~~~~~~~~t * size) { NCCLC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.hHE:C233K:(21c:o mwarning: munused function 'ncclTopoDevToRank' [-Wunused-function]- >ncclCollNet -233> | tsetsatt(irce qnucecsltR,e sduolnte_,t sniczcel)T)o;p orDeetvuTronR annckc(lsSturcuccets sn;c c}l T o| p ^~~~~~~~~~~o System* s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.hy:s30t:e21m:, warning: iunused function 'collNetCloseColl' [-Wunused-function]n t dev, int* ran k30) | s{t a t| i ^~~~~~~~~~~~~~~~~c ncclRes/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.hul:t245_:t21 :c owarning: lunused function 'ncclTopoIdToNetDev' [-Wunused-function]l NetCloseCol l245( | ssttrautcitc nnccccllCRoemsmu*l tc_otm mn,c cvloTiodp*o IcodlTloCNoemtmD)e v{( sNtCrCuLcCtH EnCcK(ccloTmomp-o>SnycsctleCmo*l lsNyestt-e>mc,l oisnetC6o4l_lt(c oildl,C oimnmt)*) ;n erteDteuvr)n {n c c| l ^~~~~~~~~~~~~~~~~~S uccess; /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h}: 258 :| 14 ^~~~~~~~~~~~~~~~: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21 :258 | warning: sunused function 'collNetCloseListen' [-Wunused-function]t atic float ncclTop o31X | GsMtIaStpiece dn(cccolnRsets uclhta_rt* cgoclnlN)e t{C l o| s ^~~~~~~~~~~~~~~~~e Listen/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h(:s268t:r14u:c twarning: unused function 'ncclTopoNVLinkBw' [-Wunused-function]n cclComm* c268o | msm,t avtoiidc* flilsotaetn Cnomcmc)l T{o pNoCCNLVCLHEiCnKk(Bcwo(mimn-t> nccucdlaCCoolmlpNCeatp-)> cl{o s e| L ^~~~~~~~~~~~~~~~i sten(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.hl:i279s:te13n:C omwarning: munused function 'isPow2' [-Wunused-function]) ); re t279u | rsnt antciccl Subcocoesls ;i s}P o w| 2 ^~~~~~~~~~~~~~~~~~( int val) In file included from {/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc : 17: | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h ^~~~~~: 124:21/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:: 282warning: :unused function 'xmlGetAttrLong' [-Wunused-function]12 : warning: unused function 'mirrorBits' [-Wunused-function] 282 | 124s | tsattaitci ci nntc cmliRrersoulrtB_itt sx(milnGte tvAatlt,r Lionngt( sptorwu2c)t {n c c| l ^~~~~~~~~~X mlNode* no/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.ccd:e261,: 21c:o nwarning: sunused function 'getIndexes' [-Wunused-function]t char* attr N261a | mset,a tiinct 6n4c_ctl*R evsaullute_)t {g e t| I ^~~~~~~~~~~~~~n dexes(in/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.ht:*151 :r21a:n kwarning: sunused function 'xmlFindNextTag' [-Wunused-function], int* indexes, i151n | ts tnaNtoidce sn)c c{l R e| s ^~~~~~~~~~u lt_t xm/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/connect.ccl:F435i:n21d:N exwarning: tunused function 'connectNvls' [-Wunused-function]T ag(struct n c435c | lsXtmalt* ixcm ln,c ccloRnesstu lcth_atr *c otnangeNcatmNev,l sstruct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* su(bNsatmreu,c ts tnrcuccltC onmcmc*l XcmolmNmo,d ei*n*t *su bn,v lcsoHnesatd sc,h airn*t antHteraNdasm)e ,{ co n| s ^~~~~~~~~~~t int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ [ 59%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 3 warnings generated when compiling for host. 1 warning generated when compiling for host. 2 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:53:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 53 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:57:19: warning: unused variable 'payload' [-Wunused-variable] 57 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 29 warnings generated when compiling for gfx1100. 7 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 1 warning generated when compiling for gfx1100. 1 warning generated when compiling for gfx1100. [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:127:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 127 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ | ^~~~~~~~~~~~~~~~~ [ 60%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp 4 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp 1 warning generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ 2 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/api_trace.cc:3: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15[ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o warnings generated when compiling for host. /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp 2 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ [ 61%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ 7 warnings generated when compiling for host. 3 warnings generated when compiling for gfx1100. [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 13 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ [ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h[ 62%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o :18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp 21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct 1 warning generated when compiling for gfx1100. ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:100:5: warning: unused label 'ignore0' [-Wunused-label] 100 | ignore0:; | ^~~~~~~~ 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:399:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 399 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:506:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 506 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:610:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 610 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 30 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 55 warnings generated when compiling for gfx1100. 2 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:512:10: warning: unused variable 'nBytes' [-Wunused-variable] 512 | size_t nBytes = count * ncclTypeSize(dataType); | ^~~~~~ [ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp 9 warnings generated when compiling for host. 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xml[ 63%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o FindTag(struct ncclXml* xm/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp l, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static nIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ cclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* nodIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ e, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp 9 warnings generated when compiling for host. 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 4 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1967:11: warning: unused variable 'stackSize' [-Wunused-variable] 1967 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:1968:19: warning: unused variable 'devProp' [-Wunused-variable] 1968 | hipDeviceProp_t devProp; | ^~~~~~~ 49 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2357:26: warning: unused variable 'payload' [-Wunused-variable] 2357 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2371:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2371 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp 23 warnings generated when compiling for gfx1100. [ 64%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2701:26: warning: unused variable 'payload' [-Wunused-variable] 2701 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2731:26: warning: unused variable 'payload' [-Wunused-variable] 2731 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:906:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 906 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/init.cc:2342:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2342 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm,In file included from v/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cppo:i1d: *In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hd:a13t: aIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h :s13iz: e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h_:t76 :s18i:z e,warning: unused variable 'y' [-Wunused-variable]i nt type, u i76n | t6 4 _ t o f f sueitn,t 3i2n_tt yf,d ,h evaodi,d *m* amnhtaindslsea); { | N ^CC LCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/misc/msccl/msccl_lifecycle.cc:32:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 32 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 2 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:75:21: warning: unused function 'xmlAlloc' [-Wunused-function] 75 | static ncclResult_t xmlAlloc(struct ncclXml** xml, int maxNodes) { | ^~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:110:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 110 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:117:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 117 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:124:21: warning: unused function 'xmlGetAttrLong' [-Wunused-function] 124 | static ncclResult_t xmlGetAttrLong(struct ncclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:132:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 132 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:139:21: warning: unused function 'xmlFindTag' [-Wunused-function] 139 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:151:21: warning: unused function 'xmlFindNextTag' [-Wunused-function] 151 | static ncclResult_t xmlFindNextTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode* prev, struct ncclXmlNode** node) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:163:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 163 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:179:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 179 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:192:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 192 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:204:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 204 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:217:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 217 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:230:21: warning: unused function 'xmlSetAttrLong' [-Wunused-function] 230 | static ncclResult_t xmlSetAttrLong(struct ncclXmlNode* node, const char* attrName, const int64_t value) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:243:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 243 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:255:21: warning: unused function 'xmlGetSub' [-Wunused-function] 255 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:281:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 281 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:288:21: warning: unused function 'xmlAddNode' [-Wunused-function] 288 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:310:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 310 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:323:21: warning: 'static' function 'xmlAddTree' declared in header file should be declared 'static inline' [-Wunneeded-internal-declaration] 323 | static ncclResult_t xmlAddTree(struct ncclXml* dst, struct ncclXmlNode* parent, struct ncclXmlNode* srcNode) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:353:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 353 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/xml.h:366:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 366 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:47:21: warning: unused function 'computeColl' [-Wunused-function] 47 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:61:21: warning: unused function 'getLoopInfo' [-Wunused-function] 61 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/enqueue.cc:794:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 794 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(sIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ truct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 15 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 10 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ . 29 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 37 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:245:21: warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 245 | static ncclResult_t ncclTopoIdToNetDev(struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ [ 65%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.hIn file included from :13/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp: :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h2:: 76In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: In file included from warning: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uIn file included from in/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cppt:312: _In file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :y13,: In file included from h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.he:a13d: ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h :m76a:n18t:i swarning: sunused variable 'y' [-Wunused-variable]a ; | ^ 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32 warnings generated when compiling for gfx1100. 2_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 10 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: tid(tid), nthreads(nunused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ threads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ andle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct nccl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hCo:m667m:*15 :c omwarning: minitializer order does not match the declaration order [-Wreorder-ctor], void* collComm, v o667i | d * s etniddD(attiad,) ,v onitdh*r eraedcsv(Dnatthar,e aidnst) ,c otuindtI,n BnlcocclkD(attharTeyapdeI_dtx .dxa)t,a Tgyrpoeu,p (ngcrcoluRpe)d,O p _| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ r e| d tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_O p, void* send M668h | a n d l es,t evpoSiidz*e (rsetcevpMShiazned_l e=,= 0v o?i dn*c*c lreSqhumeesmt.)c o{m m .| b ^~~~~~~~~~~~~~~~~u ffSizes[/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.hN:C28C:L21_:P Rwarning: Ounused function 'collNetIflush' [-Wunused-function]T O_SIMPLE]/NCCL_STEPS /28s | iszteaotfi(cT n)c c:l RsetseupSlitz_et_ c)o l{l N e| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~I f l| u group(groups h(struct ncclCom/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hm:*301 :c90o:m mnote: ,in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here void* coll Co301m | m , v o i dP*r idamtiat,i vienst< Ts,i zRee,d Ovpo,i dF*a nmAhsaynmdmleet,r ivcoE,C K/(*cDoimrme-c>tn=c*c/l0C,o lPlrNoetto-,> i0f>l upsrhi(mcso l l| C ^o mm, data, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hs:i565z:e5,: mnote: hin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herea ndle, re q565u | e st ) ) ;r urneTtruerenU ncclSuccess; } | ^~~~~~~~~~~~~ pDow/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.hn:<29T:,21 :R ewarning: dunused function 'collNetTest' [-Wunused-function]O p, ProtoSimple<1, 1,29 | CsOtLaLt_iUcN RnOcLcLl>R,e sCuOlLtL__tU NcRoOlLlLN>e(taTregsst)(;s t r| u ^c t ncclComm* com/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hm:, 203v:o66i:d *note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested herer equest, i n203t | * d o n e , iRnutn*W osrikzEel)e m{e nNtC nAclcgloC,o lPlrNoetto-,> tCeOsLtL(_rUeNqRuOeLsLt>,( )d.ornuen,( swiez)e;) ) ;| ^r eturn ncclSu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cppc:c7e:s1s:; note: }in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h: 307: | 21D:E Fwarning: Iunused function 'collNetCloseColl' [-Wunused-function]N E_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:199:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 199 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/coll_net.cc:402:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 402 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDIn file included from o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ wn, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ MPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthread23s warnings generated when compiling for host. (nthreads), tidInBlock(threadIdx.x), gIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ roup(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), In file included from group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 2 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, In file included from al/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cppg:o2,: In file included from p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hr:o10t: oIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h :4167>: (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h):.667r:u15n:( &warning: ninitializer order does not match the declaration order [-Wreorder-ctor]c clShmem.work); \ | ^667 | tid(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ht:i667d:)15,: nnote: thfield 'nthreads' will be initialized after field 'tidInBlock'r eads(nthre a667d | s ) , ttiiddI(ntBildo)c,k (ntthhrreeaaddIsd(xn.txh)r,e agdrso)u,p (tgirdoInuBpl)o,c k (| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~h r e| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_d Idx.x), gro u668p | ( g r o uspt)e,p S i| z ^~~~~~~~~~~~~~~~~e(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 15 warnings generated when compiling for host. [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ (nthreads), tidInBlockIn file included from (threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h32:_370t: 19d:a twarning: a1unused variable 'size' [-Wunused-variable], flag1, d370a | t a 2 , cfolnasgt2 ;s s i| z ^~~~~e _t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 66%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ CL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2In file included from >/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ f(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDowncount; | ^~~~ ple<1, 1, COLL_UNROLL>, COLL_UNIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ROIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ LL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWorkcount; | ^~~~ , ty, redop, algo, proto, 4>().run(&ncclShmem./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ ze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 23 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 62 | Prim/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hi:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tidC(tOiLdL)_,U NnRtOhLrLe>a,d sC(OnLtLh_UrNeRaOdLsL)>,( atrigdsI)n;B l o| c ^k (threadIdx.x), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hg:r203o:u66p:( gnote: rin instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested hereo up), | ^~~~~~~~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2;/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, pIn file included from roto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nth/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | st/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable]In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 211 | static ncclR 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ esult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, inIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140t type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 222 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:233:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 233 | static ncclResult_t ncclTop:o28D:e vwarning: Tounused variable 'data2' [-Wunused-variable]R ank(struc t 140n | c c l T oupionSty3s2t_etm *d astyas1t,e mf,l aign1t, ddeavt,a 2i,n tf*l arga2n;k ) | { ^~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h::35245:: 21warning: :unused variable 'flag2' [-Wunused-variable] warning: unused function 'ncclTopoIdToNetDev' [-Wunused-function] 140 | u245i | nstt3a2t_itc dnactcal1R,e sfullatg_1t, ndcactlaT2o,p ofIldaTgo2N;e t D| e ^~~~~v (struct ncclTopoSystem* system, int64_t id, int* netDev) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:258:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 258 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:268:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 268 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:279:13: warning: unused function 'isPow2' [-Wunused-function] 279 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/graph/topo.h:282:12: warning: unused function 'mirrorBits' [-Wunused-function] 282 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/transport/net_tmp.cc:277:21: warning: unused function 'netDumpMap' [-Wunused-function] 277 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ eUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hp:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ roto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | PrimIn file included from it/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cppi:ve2s: , 0, Proto, 0> pr667i | m s | t ^i d(tid), nthr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.he:a558d:s5(:n tnote: hrin instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested heree ads), t i558d | I n B l orcukn(Rtihnrge tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_( args); | ^ 668 | step/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hS:iz203e:(66s:t enote: pin instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested hereS ize_ == 0 203? | n c c l S h m eRmu.ncWoomrmk.EbluefmfeSnitzT()) .:r usnt(ewpeS)i;z e_ )| ^{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :12252 | :D90E:F Inote: NEin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here_ ncclDevFunc (252A | l l R e d u cPer_iRmIiNtGi_vSeIsMf,, /N*CDCiLr_eAcLtG=O*_/R0I,N GP,r oNtCoC, L0_>P RpOrTiOms_ S I| M ^P LE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h::409565::525:: note: note: expanded from macro 'DEFINE_ncclDevFunc'in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 409 | 565 | RruunnWTorrekeo,t oaSligmop,l epO(L)L._rUuNnR(O&LnLc>c,l SChOmLeLm_.UwNoRrOkL)L;> (\a r g| s ^) ; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 667 | t i203d | ( t i d ) , n tRhurneWaodrsk(Enltehmreenatdp()).,r u n| ( ^~~~~~~~~~~~~~~~~w e); | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h ^: 667:60: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: 667note: | in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here tid(tid), n7t | hDrEeaFdIsN(En_tnhcrcelaDdesv)F,u ntci(dAIlnlBRleodcukc(et_hTrReEaEd_ISdIxM.PxL)E,_ PgrreoMuupl(Sgurmo_uup3)2,, n c| c ^~~~~~~~~~~l FuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' In file included from 667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp | : 2 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ht:i33d:(19t:i dwarning: )unused variable 'size' [-Wunused-variable], nthreads(nt h33r | e a d s )c,o ntsitd IsnsBilzoec_kt( tshirzee a=d Iadrxg.sx-)>,c ogurnotu;p ( g| r ^~~~o up), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ T, RedOp, Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ , Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ tid(tid), nthreads(nthIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ 16 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.In file included from co/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cppm:m2.: bIn file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hf:f10Si: zIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hs:[168N: C/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hC:L140_:P14R: OTwarning: Ounused variable 'data1' [-Wunused-variable]_ SIMPLE]/ N140C | C L _ S TuEiPnSt/3s2i_zte ofd(aTt)a 1:, sftleapgS1i,z ed_a)t a{2 , | f ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l a g| 2 group(group; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hunused variable 'flag1' [-Wunused-variable]: 62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 140 | ui n62t | 3 2 _ t Pdraitmai1t,i vfelsa, 0/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h,: 140P:r28o:t owarning: ,unused variable 'data2' [-Wunused-variable] 0> prim s140 | | ^ uint32_t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :d558a:t5a:1 , note: fin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested herela g1, da t558a | 2 , f lraugn2R; i n| g ^~~~~< T, Re/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hd:O140p:,35 :P rwarning: ounused variable 'flag2' [-Wunused-variable]t o, COLL _140U | N R O L Lu>i(natr3g2s_)t; d a| t ^a 1, flag1, da/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ht:a2032:,66 :f lnote: agin instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here2 ; | ^~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / chaIn file included from n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:60:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 60 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_gather.h:159:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 159 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_i8, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_ST/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hE:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ PS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_n cclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128OffIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: set; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | steIn file included from p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_)In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t 17da warningtsa generated1 when compiling for host,. flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*D/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ irect=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ &nc[ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ lShmem.work); \ | /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252: tidInBlock90(threadIdx.x), group(group), | ^~~~~~~~~~~ : note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.workIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ); \ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ : warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mant/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_: 2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168 : 668/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h | :140 : 14 :s twarning: eunused variable 'data1' [-Wunused-variable]p Size(stepSiz e140_ | = = 0u i?n tn3c2c_ltS hdmaetma.1c,o mfml.abgu1f,f Sdaitzeas2[In file included from N,C /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cppC:fL2l_: aPgIn file included from R2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hO;T: O10 _| : In file included from S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h ^~~~~I: M168: P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hL:E140]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:/:14N:140C :warning: C21unused variable 'data1' [-Wunused-variable]L:_ Swarning: Tunused variable 'flag1' [-Wunused-variable]E P S140/ | s i z e140 | ou fi (n Tt 3)u2 i:_n tts 3tde2a_pSttai 1zdea_,)t af{1l ,a | g ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~1f, l adg| 1a group(group,t ad2a,t af2l,a gf2l;a g 2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h| ;: ^~~~~ 252 :| 90 ^~~~~: note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here: 140:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h21::140 :warning: 28unused variable 'flag1' [-Wunused-variable]: warning: 252unused variable 'data2' [-Wunused-variable] | 140 | Pr i 140m | i tu ii n vtue3is2n<_tTt3, 2d _aRtte add1Oa,pt ,af 1lF,aa gnf1Al,sa ygdm1am,te atd2ar,ti acf235,unused variable 'data2' [-Wunused-variable]: /warning: *unused variable 'flag2' [-Wunused-variable]D ire c140t | = * /1400 | , u Pi rn otut3io2n_,tt 3 02d>_a ttp ard1ia,mt saf1l ,a g| f1 ^l, a gd1a,t ad2a,t af2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hl,:a 565gf:25l;a: g 2note: | ;in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here ^~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140: 35565: | warning: unused variable 'flag2' [-Wunused-variable] runTre e140U | p D o w nu , COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ issa; | ^ 16 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: 9 warnings generated when compiling for host. unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp370::219: :In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hwarning: :10unused variable 'size' [-Wunused-variable]: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270: 19370: | warning: unused variable 'ptr' [-Wunused-variable] const ss i270z | e _ t s i z e ui=n tar6g4s_-t>*c oputnrt ;= r| e ^~~~c vPtr(0/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:)371+:l15l:12 8warning: Ounused variable 'bid' [-Wunused-variable]f fset; 371 | | ^~~ const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.b/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ uffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ :252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h10:: 203In file included from :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h66::168 : note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hin instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here: 140:14: warning: unused variable 'data1' [-Wunused-variable] 203 | R u140n | W o r k Eulienmte3n2t_()./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hr:u140n:(21w:e )warning: ;unused variable 'flag1' [-Wunused-variable] | ^ 140 | ui/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cppn:t73:21_t: dnote: ain instantiation of member function 'RunWork, 0, 2, 4>::run' requested heret a1, flag1, da t7a | 2D,E FfIlNaEg_2n;c c l| D ^~~~~e vFunc(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hA:l140l:R28e:d uwarning: ceunused variable 'data2' [-Wunused-variable]_ T 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ mmetric, /*Direct=*/0, Proto, 0> priREE_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ms | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]17 warnings generated when compiling for host. 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RedOp, Algo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_In file included from T/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ REE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_gather_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement2(;) . r| un ^~~~~( we);/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h : 140| : ^35 : warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp_:t7 :d1a:t anote: 1in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here, flag1, data2, 7f | lDaEgFI2N;E _ n| c ^~~~~c lDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_n c | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ clDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threa/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:3355:19 warning:s generated when compiling for hostwarning: . unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | PrimitivesIn file included from , FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreIn file included from ad/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpps):,2 : tIn file included from i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hd:I10n: BIn file included from l/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.ho:c167k: (t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hh:r667e:a15d:I dwarning: xinitializer order does not match the declaration order [-Wreorder-ctor]. x), group(group), 667| | ^~~~~~~~~~~~~~~~~ tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h(:t667i:d60):, note: nfield 'group' will be initialized after field 'stepSize't hreads(nthr e667a | d s ) , ttiiddI(ntBildo)c,k (ntthhrreeaaddIsd(xn.txh)r,e agdrso)u,p (tgirdoIunpB)l,o c k| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~t h r| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_a dIdx.x), g r668o | u p ( g rsotuepp)S,i z e| ( ^~~~~~~~~~~s tepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ T, RedOp, FanAsymmetric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] [ 67%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ 15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes17 warnings generated when compiling for host. [NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuIn file included from nc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cppA:l2l: RIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hd:u10c: eIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h :F169u: nc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hP:r270o:d19,: rwarning: ccunused variable 'ptr' [-Wunused-variable]l _bfloat8, NCCL _270A | L G O _ T R E E ,u iNnCtC6L4__PtR*O TpOt_rS I=M PrLeEc)v P t| r^( 0)+ll128Of/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hf:s406e:t52;: note: | expanded from macro 'DEFINE_ncclDevFunc' ^~~ 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u32, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u8, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hnthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_u64, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ _SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | | ^ tid(tid), nthre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ha:ds565(:n5t:h rnote: ein instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herea ds), tidIn B565l | o c k ( trhurneTardeIedUxp.Dxo)w,n , /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hC:O667L:L60_:U Nnote: Rfield 'group' will be initialized after field 'stepSize'O LL>(args); 667 | | ^ tid(tid), nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hh:r203e:a66d:s (note: nin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested heret hreads), t203i | d I n B l o c k (RtuhnrWeoardkIEdlxe.mxe)n,t ().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/size/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ of(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, In file included from Pr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cppot:o2,: In file included from 0/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h>: 10p: rIn file included from i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hm:s168 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h| : ^140 :14: warning: unused variable 'data1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: 140note: | in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here uint32 _565t | d a t ar1u,n TfrleaegU1p,D odwant | , C O LuLi_nUtN3R2O_LtL >d(aatrag1s,) ;f l a| g ^1 , data2, fla/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hg:2203;: 66 :| ^~~~~note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: 203warning: | unused variable 'data2' [-Wunused-variable] R u140n | W o r k Eulienmte3n2t_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h(:)140.:r35u:n (warning: wunused variable 'flag2' [-Wunused-variable]e ); | ^ 140 | uint3/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp2:_7t: 1d:a tnote: a1in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here, flag1, data 27, | DfElFaIgN2E;_ n c| c ^~~~~l DevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f16, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runT/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ reeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371In file included from | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count;/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, nccl | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: In file included from unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2iIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ (long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 33 | cIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ onst ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f16, ncclFuIn file included from ncA/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f16.cppl:l1Re: dIn file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hc:e17,: In file included from F/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.hu:n11c: MIn file included from i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.hn:M12a: xIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h :h126a: lIn file included from f/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h,: 14N: CIn file included from C/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hL:_37A: LIn file included from G/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hO:_14R: I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hN:G46,: 13N:C Cwarning: L_unused function 'log2i' [-Wunused-function]P ROTO_SIMPLE) 46 | | s^t atic lo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:g409 :l52o:g 2note: iexpanded from macro 'DEFINE_ncclDevFunc'( long n) { 409 | | ^~~~~ RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h: 370667: | 19 : warning: unused variable 'size' [-Wunused-variable]t id(tid), n threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ _t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().ru n667( | w e ) ; t i| d ^( tid), nthre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cppa:d7s:(1n:t hnote: rin instantiation of member function 'RunWork, 0, 2, 2>::run' requested heree ads), tidInBlo c7k | (DtEhFrIeNaEd_Indcxc.lxD)e,v Fgurnocu(pA(lglrRoeudpu)c,e _ T| R ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~E E _| S tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_I MPLE_PreMulS u668m | _ b f 1 6s,t enpcScilzFeu(nsctAelplSRiezdeu_c e=,= F0u n?c PnrcecMluSlhSmuemm,. choimpm_.bbfulfofaSti1z6e,s [NNCCCCLL__APLRGOOT_OT_RSEIEM,P LNEC]C/LN_CPCRLO_TSOT_ESPISM/PsLiEz)e o f| (^T ) : ste/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hp:S406i:z52e:_ )note: expanded from macro 'DEFINE_ncclDevFunc'{ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 406 | RunWork, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here< ty>, algo, 252p | r o t o , 2P>r(i)m.irtuinv(e&sn, 667/ | * D i r etcitd=(*t/i0d,) ,P rnotthor,e a0d>s (pnrtihmrse a d| s ^) , tidInBlock(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ht:h565r:e5a:d Inote: din instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herex .x), grou p565( | g r o u pr)u,n T r| e ^~~~~~~~~~~~~~~~~e UpDow/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hn:<667T:,60 :R enote: dfield 'group' will be initialized after field 'stepSize'O p, ProtoS i667m | p l e < 1t,i d1(,t iCdO)L,L _nUtNhRrOeLaLd>s,( nCtOhLrLe_aUdNsR)O,L Lt>i(daIrngBsl)o;c k (| t ^h readIdx.x), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hg:r203o:u66p:( gnote: rin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested hereo up), | ^~~~~~~~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp ^: 1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:7::761::18 :note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here warning: unused variable 'y' [-Wunused-variable] 776 | | D E F I N E _ n cucilnDte3v2F_utn cy(,A lhleRaedd,u cmea_nTtRiEsEs_aS;I M P| L ^E _MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(tIn file included from hr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppe:a2d: IIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hx:.10x: )In file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h :g167r: o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hu:p667(:g15r:o upwarning: )initializer order does not match the declaration order [-Wreorder-ctor], | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 667 | 668 | t isdt(etpiSdiz)e,( snttehprSeiazdes_( n=t=h r0e a?d sn)c,c ltSihdmIenmB.lcoocmkm(.tbhurfefaSdiIzdexs.[xN)C,C Lg_rPoROuTpO(_gSrIoMuPpL)E,] / N| CC ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~L _ S| T tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_E PS/sizeof(T) :668 | s t e p Ssitzeep_S)i z{e ( s| t ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e p S| i group(groupz e_ == 0 ? ncclShmem.comm.b/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hu:f252f:S90i:z enote: s[in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereN CCL_PROTO_ S252I | M P L E ] / NPCrCiLm_iStTiEvPeSs/, /*Direct=*/0,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h P:r252o:t90o:, note: 0in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here> prims | ^ 252 | Pr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ imitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 667 | tid(tid), nthreads(nthreads), tidInBlock(thread Id/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hx.:x)222,: 19g:r ouwarning: punused variable 'size' [-Wunused-variable]( group), 222| | ^~~~~~~~~~~~~~~~~ const /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hs:s667i:z60e:_ tnote: field 'group' will be initialized after field 'stepSize' size = a r667g | s - >count; | ^~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSi,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group group(group), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, pr17 warnings generated when compiling for host. oto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSi/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hze:_)667 :{15 : | warning: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~initializer order does not match the declaration order [-Wreorder-ctor] | group(group 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h : 252t:i90d:( tnote: iin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hered ), nthreads (252n | t h r e a d sP)r,i mtitiidvIensB, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bflIn file included from oat/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp1:62,: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hN:C33C:L19_:A Lwarning: Gunused variable 'size' [-Wunused-variable]O _RING, NCC L33_ | P R O T Oc_oSnIsMtP LsEs)i z e| _^t size =/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_PROTO_SIMP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hL:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ E/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h]:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing ( acrognss)t; s s| i ^z e_t size = ar/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hg:s203-:>66c:o unote: ntin instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here; | ^~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWorkA,L GaOl_gToR,E Ep,r oNtCoC,L _2P>R(O)T.Or_uSnI(M&PnLcEc)l S h| m^e m.work); \/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h : 406| : ^52 : note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /NCCL_STEP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.coS/sizeof(T) : stepSize_) m{m.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ 301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | ( )r.urnuTnr(eweeU)p;D o w| n ^< T, RedOp, ProtoS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cppi:m7p:l1e:< 1note: , in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here1 , COLL_UNROLL >7, | DCEOFLILN_EU_NnRcOcLlLD>e(vaFrugns)c;( A l| l ^R educe_TREE_SI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hM:P203L:E66_:P rnote: oin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested hered _u32, ncc l203F | u n c A l l R e dRuucneW,o rFkuEnlcePmreondt,< Funi,n tT3,2 _Rte,d ONpC,C LA_lAgLoG,O _PTrRoEtEo,, NCCOCLLL__UPNRROOTLOL_>S(I)M.PrLuEn)( w e| )^; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp :7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 409 | RunWor k7< | cDoElFlI,N Et_yn,c crleDdeovpF(,A lallRgeod,u cper_oTtRoE,E _4S>I(M)P.LrEu_nP(r&ondc_cul8S,h mnecmc.lwFournkc)A;l l\R e d| u ^c e, FuncP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hr:o667d:,15 :u inote: nfield 'nthreads' will be initialized after field 'tidInBlock't 8_t, NCCL_ A667L | G O _ T RtEiEd,( tNiCdC)L,_ PnRtOhTrOe_aSdIsMP(LnEt)h r e| a^d s), ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hd:I406n:B52l:o cnote: kexpanded from macro 'DEFINE_ncclDevFunc'( threadId x.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 406 | R u7n | WDoErFkIe,d uacleg_oT,R EpEr_oStIoM,P L2E>_(M)i.nrMuanx(_&fn8c,c lnSchcmleFmu.nwcoArlkl)R;e d\u c e| , ^ FuncMinMax,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :r667c:c15l:_ fnote: lfield 'nthreads' will be initialized after field 'tidInBlock'o at8, NCCL_AL G667O | _ T R E E,t iNdC(CtLi_dP)R,O TOn_tShIrMePaLdEs) ( n| t^h reads), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ht:i406d:I52n:B lnote: oexpanded from macro 'DEFINE_ncclDevFunc'c k(threadI d406x | . x ) , RgunrWoourpk(:,60 :a lgnote: ofield 'group' will be initialized after field 'stepSize', proto, 2 >667( | ) . r u nt(i&dnc(ctliSdh)m,e mn.twhorreka);d s\( n t| h ^r eads), ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hd:I667n:B15l:o cnote: kfield 'nthreads' will be initialized after field 'tidInBlock'( threadIdx. x667) | , g r otuipd((gtriodu)p,) ,n t h| r ^~~~~~~~~~~e ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSizIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | t_ == 0 ? ncclShmem.comid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groupm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/:*667D:i60r:e cnote: tfield 'group' will be initialized after field 'stepSize'= */0, Proto ,667 | 0 > p rtiimds( t i| d ^) , nthreads/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h(:n565t:h5r:e anote: dsin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here) , tidInBl o565c | k ( t h rreuandTIrdexe.Uxp)D,o wgnr, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown ,| group(groupC OLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here252 | Pr i203m | i t i v e s < T ,R uRneWdoOrpk,E lFeamneAnsty_,U N/R*ODLiLr>ec()t.=r*u/n0(,w eP)r;o t o| , ^0 > prims /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp| : ^7 :1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here7 | DEFINE_n c565c | l D e vrFuunnTcr(eAelUlpRDeodwuncc,e , CFOuLnLc_MUiNnRMOaLxL,> (hairpg_sb)f;l o at| 1 ^6 , NCCL_ALGO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h_T:R203E:E66,: Nnote: Cin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested hereC L_PROTO_S I203M | P LE ) | ^ RunWork/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hE:l409e:m52e:n tnote: p(<)t.yr>u,n (awleg)o;, p r| o ^t o, 4>().run(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp&:n7c:c1l:S hnote: min instantiation of member function 'RunWork, 0, 2, 2>::run' requested heree m.work); \ | ^ 7 | DEFINE_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hn:c667c:l15D:e vnote: Fufield 'nthreads' will be initialized after field 'tidInBlock'n c(AllReduc e667_ | T R E E _tSiIdM(PtLiEd_)P,r enMtuhlrSeuamd_sf(8n,t hnrcecaldFsu)n,c AtlildRIendBulcoec,k (FtuhnrcePardeIMduxl.Sxu)m,, grrcoculp_(fglrooautp8),, N C| C ^~~~~~~~~~~~~~~~~L _ALGO_T/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hR:E667E:,60 :N Cnote: CLfield 'group' will be initialized after field 'stepSize'_ PROTO_SIMP L667E | ) | ^t id(tid),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :n406t:h52r:e anote: dexpanded from macro 'DEFINE_ncclDevFunc's (nthreads) ,406 | t i d I nRBulnoWcokr(ktg,r oaulpg)o,, p| r ^~~~~~~~~~~o to, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | In file included from r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cppu:n1T: rIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.he:U13p: DIn file included from o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.hw:n13<: T/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h,: 76R:e18d:O p,warning: unused variable 'y' [-Wunused-variable]P rotoSimple <761 | , 1 , C O L L _uUiNnRtO3L2L_>t, yC,O LhLe_aUdN,R OmLaLn>t(iasrsgas;) ; | ^| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpIn file included from Do/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cppw:n2<: TIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :R10e: dIn file included from O/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hp:,167 : P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hr:o667t:o15S:i mwarning: plinitializer order does not match the declaration order [-Wreorder-ctor]e <1, 1, COLL_UNROL L667> | , C O LtLi_dU(NtRiOdL)L,> (natrhgrse)a;d s (| n ^t hreads), ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:d203I:n66B:l onote: ckin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here (thread I203d | x . x) , g r o uRpu(ngWrorokuEpl)e,m e n| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~< Fn| , tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ T, RedOp, 668 | A l g o ,s tPerpoStioz,e (CsOtLLep_SUiNzReO_L L=>=( )0. r?u nn(cwcel)S;h m e| ^m .comm.bu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cppf:f7S:i1z:e snote: [in instantiation of member function 'RunWork, 0, 2, 2>::run' requested hereN CCL_PROTO_SIM P7L | ED]E/FNICNCEL__nScTcElPDSe/vsFiuzneco(fA(lTl)Reduce_TREE_SIMPL E_:M isntMeapxS_iuz8e,_ )n c{c l F| u ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n c A| l group(groupl Reduce, FuncMinMax, ui/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hn:t8252:_90t:, note: NCin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereC L_ALGO_TREE ,252 | N C C L _ P RPrOiTmOi_tSiIvMePsL, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)In file included from , /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppg:r2o: uIn file included from p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h(:g10r: oIn file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hp:)167,: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :| 667 ^~~~~~~~~~~~~~~~~: 15: warning: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hinitializer order does not match the declaration order [-Wreorder-ctor]: 667:60: note: field 'group' will be initialized after field 'stepSize' 667 | 667 | t i d (ttiidd()t,i dn)t,h rnetahdrs(enatdhsr(enatdhsr)e,a dtsi)d,I ntBildoIcnkB(ltohcrke(atdhIrdexa.dxI)d,x .gxr)o,u pg(rgoruopu(pg)r,o u p| ) ^~~~~~~~~~~, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitivest,i d/)*,D inrtehcrte=a*d/s0(,n tPhrorteoa,d s0)>, ptriidmIsn B l| o ^c k(threadIdx/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h.:x565):,5 :g rnote: oin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested hereu p(group), 565 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | r tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_u nTreeUpDown< T,668 | R e d O ps,t ePprSoitzoeS(ismtpelpeS<1i,z e1_, =C=O L0L _?U NnRcOcLlLS>h,m eCmO.LcLo_mUmN.RbOuLfLf>S(iazregss[)N;C C L| _ ^P ROTO_SIMPLE]//builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hN:C203C:L66_:S Tnote: Ein instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested hereP S/sizeof( T203) | : s t e p SRiuzneW_o)r k{E l e| m ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e n t| < group(groupFn , T, RedOp, Algo,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :P62r:o56t:o ,note: Cin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested hereO LL_UNROL L62>( | ) . r u nP(rwiem)i;t i v| e ^s , 0, 2, 4>::run' requested herer ic<1>, 0, Pro t7o | ,D E0F>I NpEr_inmcsc l D| e ^v /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_Func(AllReduce_TREE_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threaPdRIOdTxO._xS)I,M PgLrEo)u p (| g^r oup), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h| : ^~~~~~~~~~~~~~~~~409 :52: note: expanded from macro 'DEFINE_ncclDevFunc'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:60: 409note: | field 'group' will be initialized after field 'stepSize' RunWo r667k | < c o l lt,i dt(yt,i dr)e,d onpta,d sa(lngtoh,r epardost)o,, t4i>d(I)n.Brlounc(k&(ntchrcelaShdmIedmx..xw)o,r kg)r;o u\p ( g| r ^o up), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f64, n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ cclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSi 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_nczclDeevsF[uNnCcC(LA_lPlRROeTdOu_cSeI_MRPILNEG]_/SNICMCPLL_ES_TPErPoSd/_sui8z,e onfc(cTl)F u:n csAtlelpRSeidzuec_e), {F u n| c ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~P r o| d group(group, uint8_t, NCCL_ALGO_RI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hN:G301,: 90N:C Cnote: Lin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here_ PROTO_SIMPLE) 301 | | ^ Prim/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hi:t409i:v52e:s T,Y >a,l g/o*,D iprreoctto=,* /40>,( )P.rroutno(,& n0c>c lpSrhimmesm . w| o ^r k); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hnote: :in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here667 :15: note: field 'nthreads' will be initialized after field 'tidInBlock' 565 | r u667n | T r e e UtpiDdo(wtniIn file included from d,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hI :dC10xO: .LIn file included from xL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h)_:,U169 N: gR/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hrO:270:oL19uL:p> ((warning: gaunused variable 'ptr' [-Wunused-variable]rr ogusp));, | | ^ ^~~~~~~~~~~~~~~~~ 270 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h : 667 :u60/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hi::n 203tnote: :6field 'group' will be initialized after field 'stepSize'664 :_ tnote: *in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here ptr =667 | r e203 c | v P tt ir d( (0 t) i+ dlR)lu,1n 2Wn8otOrhfkrfEeslaeedtms;e( nn tt| ((g)r.oruupn)(,w e )| ; ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:In file included from 667:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp15:: 1warning: : initializer order does not match the declaration order [-Wreorder-ctor]In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h: 126667: | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h : 14 : tIn file included from i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hd:(37t: iIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h):,14 : n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:t46h:r13e:a dwarning: sunused function 'log2i' [-Wunused-function]( nthreads) ,46 | tsitdaItniBcl olcokn(gt hlroega2diI(dlxon.gx )n,) g{r o u| p ^~~~~( group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: 17 warnings generated when compiling for host. initializer order does not match the declaration order [-Wreorder-ctor] 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id), nthreads(nthreads), ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Pri/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ mitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreaIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | st.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h note: :in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here667 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 203 | RunWor kE667l | e m e n tt((t)h.rreuand(Iwdex).;x ) ,| ^g roup(group),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp : 12| : ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~1 : | note: tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 66812 | | D E F IsNtEe_pnSciczleD(esvtFeupnSci(zAel_l R=e=d u0c e?_ RnIcNcGl_SShImMePmL.Ec_oPmrmo.db_ubfff1S6i,z ensc[cNlCFCuLn_cPARlOlTROe_dSuIcMeP,L EF]u/nNcCPCrLo_dS,T EhPiSp/_sbifzleooaft(1T6), :N CsCtLe_pASLiGzOe__R)I N{G , | N ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C C L| _ group(groupP ROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :note: 406in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here: 52: note: expanded from macro 'DEFINE_ncclDevFunc' 62 | P406r | i m i t iRvuensW1,> ,a l0g, oP,r optroo,t o0,> 2p>r(im)s. r u| n ^( &ncclShmem.w/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ho:r558k:)5;: \note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here | ^ 558 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h : 667 :r15u:n Rnote: ifield 'nthreads' will be initialized after field 'tidInBlock'n g(raeragdss)(;n t h| r ^e ads), tidInBl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ho:c203k:(66t:h rnote: ein instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested herea dIdx.x), g203r | o u p ( g r o u pR)u,n W o| r ^~~~~~~~~~~~~~~~~k Eleme/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hn:t667<:F60n:, note: Tfield 'group' will be initialized after field 'stepSize', RedOp, Al g667o | , P r ottiod,( tCiOdL)L,_ UnNtRhOrLeLa>d(s)(.nrtuhnr(ewaed)s;) , | t ^i dInBlock(thread/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().rIund(xw.ex));, g| r ^o up(group/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp):,7 : 1| : ^~~~~~~~~~~note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hnote: :667field 'nthreads' will be initialized after field 'tidInBlock': 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | 667 | t i dt(itdi(dt)i,d )n,t hnrtehardesa(dnst(hnretahdrse)a,d st)i,d ItniBdlIoncBkl(tohcrke(atdhIrdexa.dxI)d,x .gxr)o,u pg(rgroouupp()g,r o u| p ^~~~~~~~~~~~~~~~~) , | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h::667667:60::60 :note: field 'group' will be initialized after field 'stepSize'note: field 'group' will be initialized after field 'stepSize' 667667 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~ ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ epSize(stIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here ep 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TRE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]E, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>()/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock/(threNaCdCILd_xS.TxE)P,S /gsriozuepo(fg(rTo)u p:) ,s t e| p ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~S i z| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize__ ) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | 668 group(group | stepSize(stepSize_ =/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h=: 3010: 90?: nnote: cin instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herec lShmem.comm .301b | u f f S i z ePsr[iNmCiCtL_ivPeRsO{, /*| D ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~i r e| c group(groupt =*/0, Proto, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h0:>252 :p90r:i mnote: sin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here | ^ 252 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hP:r565i:m5i:t inote: vin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested heree sm,p l/e* ,0 >C OpLrLi_mUsN R O| L ^L >(args)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h;: 565 :| 5 ^: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h : 203 :r66u:n Tnote: rin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested heree eUpDownAs,li gzCoeO,_L tLP _rsUoiNtzRoOe,L L=C> O(aLarLrg_gsUs-N)>;Rc Oo Lu| Ln ^>t (;) . r| u ^~~~n (we/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h):;203 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h ::| 66371 ^: :15 :note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested herewarning: 203/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp | : 7 : 1 : note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here RunWorkElement <7 | FDnE,F ITN,E _RnecdcOlpD,e vAFlugnoc,( APlrloRtedou,c eC_OTLRLE_EU_NSRIOMLPLL>E(_)P.rreuMnu(lwSeu)m;_ f 1| 6 ^, ncclFunc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cppA:l7l:R1e:d unote: cin instantiation of member function 'RunWork, 0, 2, 4>::run' requested heree , FuncPreMu l7S | uDmE, FhIaNlEf_,n cNcClCDLe_vAFLuGnOc_(TARlElER,e dNuCcCeL__TPRREOET_OS_ISMIPMLPEL_ES)u m _| b^f 16, nccl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hF:u406n:c52A:l lnote: Reexpanded from macro 'DEFINE_ncclDevFunc'd uce, Func S406u | m , h iRpu_nbWfolroka,, NaClCgLo_,P RpOrToOt_oS,I M2P>L(E)). r u| n^( &ncclSh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hm:e409m:.52w:o rnote: kexpanded from macro 'DEFINE_ncclDevFunc') ; \ | ^ 409 | RunW/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ho:r667k:<15c:o lnote: lfield 'nthreads' will be initialized after field 'tidInBlock', ty, redop | , a l tgiod,( tpirdo)t,o ,n t4h>r(e)a.drsu(nn(&tnhcrcelaSdhsm)e,m .twiodrIkn)B;l o\c k (| t ^h readIdx./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hx:)667,: 15g:r onote: ufield 'nthreads' will be initialized after field 'tidInBlock'p (group), 667| | ^~~~~~~~~~~~~~~~~ tid(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ht:i667d:)60,: nnote: thfield 'group' will be initialized after field 'stepSize'r eads(nthre a667d | s ) , ttiiddI(ntBildo)c,k (ntthhrreeaaddIsd(xn.txh)r,e agdrso)u,p (tgirdoIunpB)l,o c k| ( ^~~~~~~~~~~~~~~~~t hrea/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hd:I667d:x60.:x )note: ,field 'group' will be initialized after field 'stepSize' group(g r667o | u p ) , t i| d ^~~~~~~~~~~( tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ .run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h | :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]C L_ALGO_TREE, N C667C | L _ P R OtTiOd_(StIiMdP)L,E )nt h r| e^a ds(nthread/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hs:),409 :t52i:d Inote: nexpanded from macro 'DEFINE_ncclDevFunc'B lock(threa d409I | d x . x )R,u ngWroorupk(, algo, 668p | r o t os,t e4p>S(i)z.er(usnt(ep&Sniczcel_S h=m=e m0. w?o rnkc)cl;S h\m e m| . ^c omm.buffS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hi:z667e:s15[:N Cnote: Cfield 'nthreads' will be initialized after field 'tidInBlock'L _PROTO_SIM P667L | E ] / N CCtLi_dS(TtEiPdS)/,s inztehorfe(aTd)s :( nstthepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | r group(groupe ads), tidInBlock/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h(:t301h:r90e:a dnote: Iin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hered x.x), gr o301u | p ( g r o uPpr)i,m i t| i ^~~~~~~~~~~~~~~~~v esa, d/s*(Dnitrherceta=d*s/)0,, PtriodtIon,B l0o>c kp(rtihmrse a d| ^I dx.x), grou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hp:(565g:r5o:u pnote: )in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here, | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEF ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~IN E _| n group(groupc clDevFunc(AllReduce/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h_:T62RE:E56_:S Inote: Min instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereP LE_Prod_b f621 | 6 , n cPcrliFmuintciAvlelsRt,1 60,, NPCrCoLt_oA,L G0O>_ TpRrEiEm,s N C| C ^L _PROTO_SIMP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hL:E558): 5 :| ^note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h: 409558: | 52 : note: expanded from macro 'DEFINE_ncclDevFunc'r unRingo(pa),; a l| g ^o , proto, 4>(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h):.203r:u66n:( ¬e: ncin instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hhr:e667a:d15s:( nwarning: tinitializer order does not match the declaration order [-Wreorder-ctor]h reads), tidInBloc k667( | t h r e atdiIdd(xt.ixd)),, gnrtohurpe(agdrso(unpt)h,r e a| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~s ) ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_t idInBlock(th re668a | d I d x .sxt)e,p Sgirzoeu(ps(tgerpoSuipz)e,_ =| = ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 0 | ? tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ ncclShmem.co m668m | . b u f fsStiepzSeisz[eN(CsCtLe_pPSRiOzTeO__ S=I=M P0L E?] /nNcCclCSLh_mSeTmE.PcSo/msmi.zbeuofff(STi)z e:s [sNtCeCpLS_iPzReO_T)O _{S IM P| L ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~E ] /| N group(groupC CL_STEPS/sizeof(T)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h ::252 :s90t:e pnote: Sin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested herei ze_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 252| | group(group Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herea nAsymmetric< N301C | C L _ M A XP_rDiEmVi_tAiRvIeTsY<,T ,1 >R,ed O/p*,D iFraencAts=y*m/m0e,t rPircoC Lp_rMAiXm_sD E V| _ ^A RITY>, /*Di/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hre:c565t:=5*:/0 ,note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested hereP roto, 0> p565r | i m s r| u ^n TreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here ProtoSimpl e565< | 1 , 1 ,r unCTOrLeLe_UUpNDRoOwLnL<>T,, CROeLdLO_pU,N RPOrLoLt>o(Sairmgpsl)e;< 1 ,| ^1 , COLL_UNRO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hL:L>203,: 66C:O Lnote: Lin instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here_ UNROLL>(a r203g | s ) ; | ^ RunWorkEleme/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:t203<:F66n:, note: Tin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here, RedOp, A l203g | o , P r o t oR,u nCWOoLrLk_EUlNeRmOeLntL<>F(n),. rTu,n (Rweed);O p ,| ^A lgo, Proto/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp,: 7C:O1L:L _note: Uin instantiation of member function 'RunWork, 0, 2, 4>::run' requested hereN ROLL>().run (7w | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TRE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hE,: N667C:CL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ e); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMin15Ma:x ,warning: initializer order does not match the declaration order [-Wreorder-ctor]u int8_t, NCCL_ALGO_T R667E | E , N CtCiLd_(PtRiOdT)O,_ SnItMhPrLeEa)d s (| n^t hreads),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :t406i:d52I:n Bnote: lexpanded from macro 'DEFINE_ncclDevFunc'o ck(thread I406d | x . x ) ,R ugnWroorukp<(cgorlolu,p )t,y , r| e ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~d o p| < tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_t y>, algo, pro t668o | , 2 > (s)t.erpuSni(z&en(csctleSphSmiezme._w o=r=k )0; ?\ n c| c ^l Shmem.comm/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h.:b667u:f15f:S inote: zfield 'nthreads' will be initialized after field 'tidInBlock'e s[NCCL_PROT O667_ | S I M P LtEi]d/(NtCiCdL)_,S TnEtPhSr/esaidzse(onft(hTr)e a:d ss)t,e ptSiidzIen_B)l o{c k( t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d group(groupI dx.x), group(group),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h : 301| : ^~~~~~~~~~~~~~~~~90 : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 301 | P r667i | m i t i vteisd<(Tt,i dR)e,d Onpt,h rFeaandAss(ynmtmherteraidcs<)1,, tNiCdCILn_BMlAoXck_(DtEhVr_eAaRdIITdYx>.,x )/,* Dgirroeucpt(=g*r/o0u,p )P,r o t| o ^~~~~~~~~~~, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: 667| : group(group15 : warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: 667in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here | tid(tid) ,301 | n t h r e a dPsr(inmtihtrievaedss<)T,, tRieddIOnpB,l oFcakn(AtshyrmemaedtIrdixc. , | / tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_* Direct=*/0, P668r | o t o , s0t> epprSiimzse (| s ^t epSize_ == 0/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :?565 :n5c:c lnote: Sin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested hereh mem.comm. b565u | f f S i zreusn[TNrCeCeLU_pPDRoOwTnO<_TS,I MRPeLdEO]p/,N CPCrLo_tSoTSEiPmSp/lsei_,) C{O L L| _U ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~N R O| L group(groupL >(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing<(nthreads), tidInBlock(thT, RedOp, Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ readIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads),In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShm_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ em.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | In file included from ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f64.cppn:Tr1e: eIn file included from U/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hp:D17o: wIn file included from n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h<:T11,: In file included from R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.he:d12O: pIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h :P126r: oIn file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.ho:S14: iIn file included from m/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hp:l37e: , COLL_U N46R | OLsLt>a(taircgs); | ^ OL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hL:>203(:)66.:r unote: n(in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested herew e); | ^ 203 | RunWork/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cppE:l7e:m1e:n tnote: , 0, 2, 4>::run' requested hereF n, T, RedOp, A7l | gDoE,F IPNrEo_tnoc,c lCDOeLvLF_uUnNcR(OALlLl>R(e)d.urcuen_(TwReE)E;_ S I| M ^P LE_PreMulSum_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cppf:176:,1 :n cnote: cin instantiation of member function 'RunWork, 0, 2, 4>::run' requested herelF uncAllReduc e7, | DFEuFnIcNPEre_MnuclcSluDme,v Fhuanlcf(,A llNRCeCdL_uAcLeG_OT_RTEREE_E,S INMCPCLL_EP_RPOrTO_SIMPLE) | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp409::252: :In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hnote: :expanded from macro 'DEFINE_ncclDevFunc'10 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270 :19409: | warning: unused variable 'ptr' [-Wunused-variable] RunWork6,4 _atl*g op,t rp r=o troe,c v4P>t(r)(.0r)u+nl(l&1n2c8cOlfSfhsmeetm;. w o| r ^~~k ); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ eMu l668S | u m _ f 8s,t enpcScilzFeu(nsctAelplSRiezdeu_c e=,= F0u n?c PnrcecMluSlhSmuemm,. crocmcml._bfulfofSaitz8e,s [NNCCCCLL__APLRGOOT_OT_RSEIE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ long log2i(long n) { | ^~~~~ MPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreadsIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h: 33667: | 19 : warning: unused variable 'size' [-Wunused-variable]t id(tid), nt h33r | e a d s (cnotnhsrte asdssi)z,e _tti dsIinzBel o=c ka(rtghsr-e>acdoIudnxt.;x ) ,| ^~~~g roup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDowncount; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ L>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TRE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ E, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h, F:un667c:M15i:n Mawarning: xinitializer order does not match the declaration order [-Wreorder-ctor], uint8_t, NCCL_ALGO_ T667R | E E , NtCiCdL(_tPiRdO)T,O _nStIhMPrLeEa)d s (| n^ threads/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h):,409 :t52i:d Inote: nexpanded from macro 'DEFINE_ncclDevFunc'B lock(thr e409a | d I d x .Rxu)nW,o rgkr, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bfL8,L _UnNcRcOlLFLu>n,c AClOlLRLe_dUuNcReO,L LF>u(nacrPgsr)e;M u l| S ^u m, rccl_bfloat8,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :N203C:C66L:_ Anote: Lin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested hereG O_TREE, N C203C | L _ P R O T O _ SRIuMnPWLoEr)k E l| e^m ento(l)l.,ru nt(yw,e )r;e d o| p ^< ty>, algo, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cppp:r7o:t1o:, note: 4in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here> ().run(&ncclS h7m | eDmE.FwIoNrE_kn)c;c l\D e v| F ^u nc(AllRed/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hu:ce667_:T15:R Enote: Efield 'nthreads' will be initialized after field 'tidInBlock'_ SIMPLE_Pre M667u | l S u m _tfi6d4(,t indc)c,l FnutnhcrAelaldRse(dnutcher,e aFdusn)c,P rteiMduIlnSBulmo,c kd(otuhbrleea,d INdCxC.Lx_)A,L GgOr_oTRuEpE(,g rNoCuCpL)_,P R O| T ^~~~~~~~~~~~~~~~~O _SIMPLE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h): 667 :| 60^: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: 667note: | expanded from macro 'DEFINE_ncclDevFunc' tid(t i406d | ) , n tRhunrWeoardks<(cnotlhlr,e atdys,) ,r etdiodpIo,c ka(ltghor,e apdrIodtxo.,x 2)>,( )g.rrouunp((&gnrcoculpS)h,m e m| . ^~~~~~~~~~~w ork); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROT/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads)O,_ StIiMdPILnEB]l/oNcCkC(Lt_hSrTeEaPdSI/dsxi.zxeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElementh(r)e.arduInd(xw.ex));, g| r ^o up(group), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp :| 7 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: 1 :| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 668 | 7 | D E FsItNeEp_Sniczcel(DsetveFpuSnicz(eA_l l=R=e d0u c?e _nTcRcElES_hSmIeMmP.LcEo_mmP.rbeuMfuflSiSzuems_[fN3C2C,L _nPcRcOlTFOu_nScIAMlPlLREe]d/uNcCeC,L _FSuTnEcPPSr/esMiuzleSoufm(,T )f l:o astt,e pNSCiCzLe__A) LG{O _ T| R ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ E E| , group(group NCCL_PROTO_SIMPL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hE:)62 : 56| :^ note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406: 5262: | note: expanded from macro 'DEFINE_ncclDevFunc' Primiti v406e | s < T , RRuendWOopr,k p,< t0y,> ,P raoltgoo,, 0p>r optroi,m s2 > (| ) ^. run(&ncclShm/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.he:m558.:w5o:r knote: )in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here; \ | ^ 558 | run/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hR:i667n:g15<:T ,note: field 'nthreads' will be initialized after field 'tidInBlock'R edOp, Proto, 667C | O L L _ UtNiRdO(LtLi>d()a,r gnst)h;r e a| d ^s (nthreads), ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hdI:n203B:l66o:c knote: (in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested heret hreadIdx. x203) | , g r o u p ( gRruonuWporkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here ), group( g12r | oDuEpF)I,N E _| n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~c c l| D tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_e vFunc(AllReduc e668_ | R I N G _sStIeMpPSLiEz_eP(rsetMeuplSSiuzm_eb_f 1=6=, n0c c?l FnucncclASlhlmReemd.uccoem,m .FbuunfcfPSriezMeusl[SNuCmC,L _hPiRpO_TbOf_lSoIaMtP1L6E,] /NNCCCCLL__ASLTGEOP_SR/IsNiGz,e oNfC(CTL)_ P:R OsTtOe_pSSIiMzPeL_E) ){ | ^| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h: 62409: | 56 : note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested hereR unWorkT,, aRlegdoO,p ,p rFoatnSoy,m m4e>t(r)i.cr(,& n0c,c lPSrhomteom,. w0o>r kp)r;i m\s | | ^ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h15::558 :note: 5field 'nthreads' will be initialized after field 'tidInBlock': note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 667 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElementcount; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ ), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads),L tLi_dUINnRBOlLoLc>k(()t.hrruena(dwIed)x;. x )| , ^ group(group), | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp ^~~~~~~~~~~: 12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | | t itdi(dt(itdi)d,) ,n tnhtrheraedasd(sn(tnhtrheraedasd)s,) ,t itdiIdnIBnlBolcokc(kt(htrheraeaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h::667:667:6060:: note: note: field 'group' will be initialized after field 'stepSize'field 'group' will be initialized after field 'stepSize' 667667 | | ttiidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)), , | ^~~~~~~~~~~| ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hup:)667,: 15 :| ^~~~~~~~~~~~~~~~~ warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | 667 | t i tidd((ttiidd)),, nntthhrreeaaddss((nntthhrreeaaddss)),, ttiiddIInnBBlloocckk((tthhrreeaaddIIddxx..xx)),, ggrroouupp((ggrroouupp)),, | | ^~~~~~~~~~~ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | steIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ pSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor]12 | DEFINE_ncclDevFunc(A l667l | R e d u ctei_dR(ItNiGd_)S,I MnPtLhEr_eMaidnsM(anxt_hfr8e,a dnsc),c ltFiudnIcnABllloRcekd(utcher,e aFduIndcxM.ixnM)a,x ,g rrocucpl(_gfrloouapt)8,, N| C ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~C L _A| L tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_G O_RING, NC C668L | _ P R O TsOt_eSpISMiPzLeE()s t e| p^S ize_ ==/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :0406: 52?: nnote: cexpanded from macro 'DEFINE_ncclDevFunc'c lShmem .406c | o m m .RbuunfWfSoirzke],/ NaClCgLo_, SpTroEtPoS,/ si2z>e(o)f.(rTu)n (:& nsctcelpSShimzeem_.)w o{r k )| ; ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ \ | group(group| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 667 | t62i | d( t i d )P,r inmtihtrievaedss<(Tn,t hRreedaOdps,) ,F atniSdyImnmBeltorcikc(r,e a0d,I dPxr.oxt)o,, g0r>o uppr(igmrso u p| ) ^, | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h::667558::605:: note: note: field 'group' will be initialized after field 'stepSize'in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | 667 | r utniRdi(ntgi(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nth/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hrea:d667s(:n15t:h rwarning: eainitializer order does not match the declaration order [-Wreorder-ctor]d s), tidInBlock(thre a667dI | d x . x )t,i dg(rtoiudp)(,g rnotuhpr)e,a d s| ( ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~n t h| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_e ads), tidInB l668o | c k ( t hsrteeapdSIidzxe.(xs)t,e pgSriozuep_( g=r=o u0p )?, n c| c ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~lS h m| e tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_m .comm.buffSi z668e | s [ N C CsLt_ePpRSOiTzOe_(SsItMePpLSEi]z/eN_CC L=_=S T0E P?S /nsciczleSohfm(eTm). c:o msmt.ebpuSfifzSei_z)e s{[ N C| C ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~L _ P| R group(groupO TO_SIMPLE]/N/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hC:C62L:_56S:T Enote: Pin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested hereS /sizeof (62T | ) : PsrtiempiStiizvee_s)< T{, R e| d ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~O p ,| group(group FanSymmetric<1>/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h,: 620:,56 :Pr otnote: oin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here, 0> pri m62 | s | ^P rimitives/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h<:T558,: 5R:e dnote: Oin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested herep , FanS y558m | m e t r ircui,n g0<,T ,P rRoetdoO,p ,0 P>r optroi,m sC OL L| _ ^U NROLL>(arg/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hs:)558:;5 : | note: ^in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :r203u:n66R:i nnote: g(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hth:r667e:a15d:I dwarning: x.initializer order does not match the declaration order [-Wreorder-ctor]x ), group(group), | ^~~~~~~~~~~667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h: 667406: | 15 : warning: initializer order does not match the declaration order [-Wreorder-ctor]R unWorki,d (atligdo),, pnrtohtroe,a d2s>((n)t.hrruena(d&sn)c,c ltSihdmIenmB.lwoocrkk()t;h r\e a d| I ^d x.x), gro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hu:p667(:g15r:o unote: pfield 'nthreads' will be initialized after field 'tidInBlock') , | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 667 | tid( tid), nthreads(nt668hr | e a d s )s,t etpiSdiIzneB(lsotcekp(Stihzree_a d=I=d x0. x?) ,n cgcrloSuhpm(egmr.ocuopm)m,. b u| f ^~~~~~~~~~~~~~~~~f Sizes/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h[:N667C:C60L:_ Pnote: Rfield 'group' will be initialized after field 'stepSize'O TO_SIMPLE] /667N | C C L _ StTiEdP(St/isdi)z,e onft(hTr)e a:d ss(tnetphSirzeea_d)s ){, t| i ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d I n| B group(groupl ock(threadIdx.x)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h,: g252r:o90u:p (note: gin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested herer oup), | ^~~~~~~~~~~ 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: duce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllRe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hdu:c667e:,15 :F uwarning: ninitializer order does not match the declaration order [-Wreorder-ctor]cM inMax, floa t667 | , N C CtLi_dA(LtGiOd_)T,R EnEt,h rNeCaCdLs_(PnRtOhTrOe_aSdIsM)P,L Et)i d I| n^B lock(th/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hr:e406a:d52I:d xnote: .expanded from macro 'DEFINE_ncclDevFunc'x) , grou p406( | g r o u pR)u,n W o| r ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~k< c o| l tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_l , ty, red o668p | < t y > ,s tealpSgoi,z ep(rstotepoS,i z2e>_( )=.=r u0n (?& nnccccllSShhmmeemm..wcoormkm).;b u\f f S| ^i zes[NCCL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h_:P667R:O15T:O _note: Sfield 'nthreads' will be initialized after field 'tidInBlock'I MPLE]/NCCL _667S | T E P S /tsiidz(etoifd()T,) n:th rsetaedpsS(inztehr_e)a d{s ) ,| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t i d| I group(groupn Block(threadIdx.x),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :g301r:o90u:p (note: gin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested herer oup), | ^~~~~~~~~~~~~~~~~ 301 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h : 667 :P60r:i mnote: ifield 'group' will be initialized after field 'stepSize't ivesB,l o/c*kD(itrherceta=d*Id/x0.,x )P,r ogtroo,u p0(>g rporuipm)s, | | ^ ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ha:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ o, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ (nthreads), tidInB| group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h,: 12C: OIn file included from L/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hL:_126U: NIn file included from RO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.hL:L14>: (In file included from a/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hr:g37s: )In file included from ;/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h : 14| : ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h :46:13: warning: unused function 'log2i' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66 : 46note: | in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested heres tatic lon g203 | l o g 2 i ( l o nRgu nnW)o r{k E l| e ^~~~~m ent().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u8, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ threads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(ar/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ gs); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().ruIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ n(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncc warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ lDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllRed/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u8, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(In file included from group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 6 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(l:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ong n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_bf16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u32, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? nc17 warnings generated when compiling for host. clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hp(:g667r:o15u:p ),warning: initializer order does not match the declaration order [-Wreorder-ctor] | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 667 | 668 | t i ds(tteipdS)i,z en(tshtreepaSdisz(en_t h=r=e a0d s?) ,n ctcildSIhnmBelmo.ccko(mtmh.rbeuafdfISdixz.exs)[,N CgCrLo_uPpR(OgTrOo_uSpI)M,P L E| ] ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~/ N C| C tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_L _STEPS/sizeo f668( | T ) : sstteeppSSiizzee(_s)t e{p S i| z ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e _| group(group= = 0 ? ncclShme/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:m62.:c56o:m mnote: .in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested herebu ffSize s62[ | N C C L _PPrRiOmTiOt_iSvIeMsP:, s0t, ePprSoitzoe,_ )0 >{ p | r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ im s| group(group | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h558::2525::90 :note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested herenote: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 558 | r252u | n R i n g < TP,r ReidmOipt,i vPersoy(mamregtsr)i;c < N| C ^C L_MAX_DEIn file included from V_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf16.cppA:RI1/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hT: :YIn file included from 203,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h: :66117:>: ,In file included from note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h/in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here:* 11D: iIn file included from r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.he:c12t: =In file included from */builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h /:2030126 | ,: In file included from P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h r: 14o t: In file included from o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h, : R370u: >nIn file included from W/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hpo:rr14ik: mE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hls:e 46m :e| 13n ^:t , ProtoSimple<1, 1, 4>, 4>' requested heret iPcr oltoon,g ClO oL565gL | 2_ iU (N lR oOnrLguLn >Tn(r))e .e{rU up nD| ( ^~~~~ow wen)<;T , | R ^e dOp, ProtoSim/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cppp:le12<:11,: 1note: ,in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here COLL_UNROLL>, C12O | LDLE_FUINNREO_LnLc>c(laDregvsF)u;n c (| A ^l lReduce_RING/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ , ncc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hl:F667u:n15c:A lnote: lfield 'nthreads' will be initialized after field 'tidInBlock'R educe, Fun c667M | i n M a xt,i df(ltoiadt),, NnCtChLr_eAaLdGsO(_nTtRhErEe,a dNsC)C,L _tPiRdOITnOB_lSoIcMkP(LtEh)r e a| d^I dx.x), gr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ho:u409p:(52g:r ounote: pexpanded from macro 'DEFINE_ncclDevFunc') , | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h409: | 667 : 60 : Rnote: ufield 'group' will be initialized after field 'stepSize'n Work ,n tahlrgeoa,d sp(rnotthor,e a4d>s()),. rtuind(I&nnBclcolcSkh(mtehmr.ewaodrIkd)x;. x\) , | g ^r oup(grou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hp:)667,: 15 :| ^~~~~~~~~~~note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ha:rg667s:)15;: warning: | initializer order does not match the declaration order [-Wreorder-ctor] ^ 667 | tid(t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hid:)203,: 66n:t hrnote: ein instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested herea ds(nthreads) ,203 | t i d I n B l o cRku(ntWhorrekaEdlIedmxe.nxt)<,F ng,r oTu,p (RgerdoOupp,) ,A l g| o ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, P| r tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_o to, COLL_UNR O668L | L > ( ) .srtuenp(Swiez)e;( s t| e ^p Size_ == 0 ? /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cppn:c12c:l1S:h mnote: ein instantiation of member function 'RunWork, 1, 2, 4>::run' requested herem .comm.buffSi z12e | sD[ENFCICNLE__nPcRcOlTDOe_vSFIuMnPcL(EA]l/lNRCeCdLu_cSeT_ERPISN/Gs_izSeIoMfP(LTE)_ S:u ms_tbefp1S6i,z en_c)c l{F un c| A ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~l l R| e group(groupd uce, FuncSum, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hh:i252p:_90b:f lnote: oain instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested heret 16, NCCL_ A252L | G O _ R I N GP,r iNmCiCtLi_vPeRsOW,o r/k*0,> aplrgiom,s p r| o ^t o, 4>()/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h.:r565u:n5(:& nnote: cin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested herecl Shmem.w o565r | k ) ; \r u n| T ^r eeUpDowna,d sC(OnLtLh_rUeNaRdOsL)L,> (tairdgIsn)B;l o c| k ^( threadId/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hx:.203x:)66,: gnote: rin instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested hereo up(group )203, | | ^~~~~~~~~~~~~~~~~ Run/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hW:o667r:k60E:l enote: mfield 'group' will be initialized after field 'stepSize'e nt)(,) .triudInn(Bwleo)c;k ( t| h ^r eadIdx.x), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cppg:r7o:u1p:( gnote: rin instantiation of member function 'RunWork, 0, 2, 4>::run' requested hereo up), | ^~~~~~~~~~~ 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h222::20319::66 :warning: note: unused variable 'size' [-Wunused-variable]in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 222203 | | c o n s tR usnsWiozrek_Etl esmieznet <=F na,r gTs,- >RceoduOnpt,; A l| g ^~~~o , Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h);: 370 :| 19 ^: warning: unused variable 'size' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp :37012 | : 1 : note: cin instantiation of member function 'RunWork, 1, 2, 2>::run' requested hereo nst ssize_t s12i | zDeE F=I NaEr_gnsc-c>lcDoeuvnFtu;n c (| A ^~~~l lRed/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hu:c371e:_15R:I Nwarning: Gunused variable 'bid' [-Wunused-variable]_ SIMPLE_ P371r | o d _ f 8c,o nnsctc liFnutn cbAildl R=e dgurcied,O fFfusnectP r/o dc,h arncncell_Cfoluonatt;8 , | N ^~~C CL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_In file included from SI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cppM:PL1E: ]In file included from //builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hN:C17C: LIn file included from _/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.hS:T11E: PIn file included from S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h/:s12i: zIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.ho:f126(: TIn file included from )/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h ::14 : sIn file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.he:p37S: iIn file included from z/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.he:_14): /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h{: 46 :| 13 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: warning: | group(groupunused function 'log2i' [-Wunused-function] 46 | sta/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ht:i62c: 56l:o nnote: gin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here log2i(lo n62g | n ) {P r i| m ^~~~~i tives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 17 warnings generated when compiling for host. | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hIn:B667l:o15c:k (twarning: hinitializer order does not match the declaration order [-Wreorder-ctor]r eadIdx.x), group(g ro667u | p ) , t| i ^~~~~~~~~~~d (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h: :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h62::3356::19 :note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested herewarning: unused variable 'size' [-Wunused-variable] 62 | 33 | P r icmointsitv essstcroiucn , | 0 ^~~~, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667 :66815 | : warning: initializer order does not match the declaration order [-Wreorder-ctor] stepSize(stepSize_ 667= | = 0 ?t indc(cltSihdm)e,m .nctohmrme.abdusf(fnSitzherse[aNdCsC)L,_ PtRiOdTIOn_BSlIoMcPkL(Et]h/rNeCaCdLI_dSxT.ExP)S,/ sgirzoeuopf((gTr)o u:p )s,t e p| S ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~i z e| _ tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 668 | stepSize(s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ht:e62p:S56i:z enote: _in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here == 0 ? 62n | c c l S hPmreimm.ictoimvme.sbE,] /0N,C PCrLo_tSoT,E P0S>/ spirziemso f (| T ^) : stepSize_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h): 558{: 5 :| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here | group(group 558 | runRin/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hg:<252T:,90 :R enote: dOin instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested herep , Proto, COL L252_ | U N R O LL > (Parrigmsi)t;i v e| ^s , 1, 2, 2>::run' requested herei cor,k E/l*eDmiernetcg op,r iPmrso t o| , ^ COLL_UNROLL>()/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h.:ru565n:(5w:e )note: ;in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here | ^ 565 | runT/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cppr:e12e:U1p:D onote: win instantiation of member function 'RunWork, 1, 2, 2>::run' requested heren c,e _CROILNLG__USNIRMOPLLLE>_(MairngMsa)x;_ u 8| , ^ ncclFuncAllRe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hd:u203c:e66,: Fnote: unin instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested herec MinMax, 203u | i n t 8 _ t , NRCuCnLW_oArLkGEOl_eRmIeNnGt,< FNnC,C LT_,P RROeTdOO_pS,I MAPlLgEo), P r| o^t o, COLL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h_:U406N:R52O:L Lnote: >expanded from macro 'DEFINE_ncclDevFunc'( ).run(w e406) | ; | R ^u nWork, 0, 2, 4>::run' requested hereo p, algo ,7 | pDrEoFItNoE,_ n2c>c(l)D.ervuFnu(n&cn(cAclllSRhemdeumc.ew_oTrRkE)E;_ S\I M P| L ^E _PreMulS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hu:m667_:f153:2 ,note: field 'nthreads' will be initialized after field 'tidInBlock'n cclFuncA l667l | R e d u ctei,d (Ftuidn)c,P rnetMhurleSaudms,( nftlhoraeta,d sN)C,C Lt_iAdLIGnOB_lToRcEkE(,t hNrCeCaLd_IPdRxO.TxO)_,S IgMrPoLuEp)( g r| o^u p), | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h ^~~~~~~~~~~~~~~~~: 409:52: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hnote: :expanded from macro 'DEFINE_ncclDevFunc'667 :60: note: field 'group' will be initialized after field 'stepSize' 409 | R u667n | W o r k n,t harlegaod,s )p,r ottiod,I n4B>l(o)c.k(rtuhnr(e&andcIcdlxS.hxm)e,m .gwrork)o; u\p( g r| o ^u p), | ^~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims 17 | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 37 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STE17PS warning/ss generatedi when compiling for hostz. eof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ L_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ S/sizeof(T) In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ric<1>, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRingcount; | ^~~~ dOp, Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(A/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hl:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ lReduce_RING_SIMPLE_Prod_u32, ncclFuncAllReduce, FuncProd, uin/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(t32_t, NCCgroup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(thread[ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o L_ALGO_RING, NCCLIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _PROTO_SIMPLE) In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(thread/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_bf8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Idx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp :2 : rIn file included from un/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hR:i10n: gIn file included from (140a | r g s ) ;u i n| t ^3 2_t data1, fl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ha:g2031:,66 :d anote: tin instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested herea 2, flag2; 203 | | ^~~~~ R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hu:nWorkElement ( )u.inrutn3(2w_et) ;d a t| a ^1 , flag1, dat/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cppa:212,: 1f:l anote: gin instantiation of member function 'RunWork, 1, 2, 4>::run' requested here2 ; | ^~~~~ 12 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hD:E140F:I28N:E _warning: nunused variable 'data2' [-Wunused-variable]c clDevFun c140( | A l l R eudiuncte3_2R_ItN Gd_aStIaM1P,L Ef_lMaign1M,a xd_atua82,, nfccllaFgu2n;c A l| l ^~~~~R educe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h,: 140F:u35n:c Mwarning: iunused variable 'flag2' [-Wunused-variable]n Max, u i140nt | 8 _ t ,u iNnCtC3L2__AtL GdOa_tRaI1N,G ,f lNaCgC1L,_ PdRaOtTaO2_,S IfMlPaLgE2); | ^| ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ = recvPtr(0)+ll128OffIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ set; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 667 | 222 | t i d (ctoinds)t, snstihzree_atd ss(inzteh r=e aadrsg)s,- >tcioduInntB;l o c| k ^~~~( threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ nt; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37In file included from : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h::370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; 126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthread17 warnings generated when compiling for host. s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, prIn file included from oto/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp,: 22: >In file included from (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h):.r10u: nIn file included from (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h&:n168c: c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hl:Sh140m:e14m:. wwarning: ounused variable 'data1' [-Wunused-variable]r k); \ | ^ 140 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :u667i:n15t32_t data:1 ,note: ffield 'nthreads' will be initialized after field 'tidInBlock'l ag1, data2, 667f | l a g 2 ;t i d| ( ^~~~~t id), nth/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hr:e140a:d21s:( nwarning: tunused variable 'flag1' [-Wunused-variable]h reads), t140i | d I n B luoicnkt(3t2h_rte addaItdax1.,x )f,l aggr1o,u pd(agtrao2u,p )f,l a g| 2 ^~~~~~~~~~~~~~~~~; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h60::140 note: :field 'group' will be initialized after field 'stepSize'28: warning: unused variable 'data2' [-Wunused-variable] 667 | 140 | t iudi(ntti3d2)_,t ndtahtrae1a,d sf(lnatgh1r,e addasta),2 ,t ifdlIangB2l;o c k| ( ^~~~~t hreadI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hd:x.140x:)35,: gwarning: runused variable 'flag2' [-Wunused-variable]o up(grou p140) | , | ^~~~~~~~~~~u int32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | In file included from c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] onst ssize_t size = args->count; | ^~~~ 46 | static long log2i(l/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hon:g 370n:)19 :{ warning: | unused variable 'size' [-Wunused-variable] ^~~~~ 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), 17 warnings generated when compiling for host. | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize17 warnings generated when compiling for host. _ == 0 ? In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDownIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ , COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threaunWork,dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid) a, nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ lgo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ InBlock/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2,17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | ste/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here pSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PR 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ OTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h17 warnings generated when compiling for host. :62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWoIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ rkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f64, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduceIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ _TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_u64, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_f32, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives ,warning: initializer order does not match the declaration order [-Wreorder-ctor]/ *Direct=*/0, Proto ,667 | 0 > p rtiimds( t i| d ^) , nthreads(nthreads/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h):,565 :t5i:d Inote: nin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested hereB lock(threa d565I | d x . x )r,u ngTrroeuepU(pgDroowunp<)T,, R e| d ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~O p ,| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_P rotoSimple<1 ,668 | 1 , C OsLtLe_pUSNiROzLeL(>s,t eCpOSLiLz_eU_N =R=O L0L >?( anrcgcsl)S;h m e| m ^. comm.buffSiz/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.he:s203[:N66C:C Lnote: _in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested hereP ROTO_SI M203P | L E ] / N C C L _RSuTnEWPoSr/ksEilzeemoefn(tT<)F n:, sTt,e pRSeidzOep_,) A{l g o| , ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ P r| o group(groupt o, COLL_UNROLL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h>:(301).run(we); | ^ :90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 301 | Pr 7 | DEFINE_nccilDmeivtFiuvnecs(c,e ,/ *FDuinrceScutm=,* /h0a,l fP,r oNtCoC,L _0A>L GpOr_iTmRsEE , | N ^C CL_PROTO_SIMPL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hE:)565 : 5| :^ note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406 :56552 | : note: expanded from macro 'DEFINE_ncclDevFunc' runTreeUp D406o | w n < T ,R uRneWdoOrpk,< cPorlolt,o Stiym,p lreeC,O LaLl_gUoN,R OpLrLo>t,o ,C O2L>L(_).UruNnR(O&LnLc>c(laSrhgmse)m;. w o| r ^k ); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:: 667note: :in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here15 : note: field 'nthreads' will be initialized after field 'tidInBlock' 203 | 667 | R utniWdo(rtkiEdl)e,m enntth,( )g.rrouunp((wger)o;up ) ,| ^ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp::60:7: 1note: :field 'group' will be initialized after field 'stepSize' note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 667 | 7t | iDdE(FtINiEd_)n,c cnltDherveFaudnsc((nAtlhlrReeaddusc)e,_ TtRiEdEI_nSBIlMoPcLkE(_tPhrroeda_dfI6d4x,. xn)c,clFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads17), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | : warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreadIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | PrimitivIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ escount; | ^~~~ , FanAsymmetric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | r tid(ottiod,) ,0 >n tphrriemasd s (| n ^t hreads), tidInBloc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hk:(t565h:r5e:a dnote: Iin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested hered x.x), gr o565u | p ( g r oruupn),T r e| e ^~~~~~~~~~~U pDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); 667| | ^ tid(tid),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp :n12t:h1r:e anote: dsin instantiation of member function 'RunWork, 1, 2, 2>::run' requested here( nthreads), t i12d | IDnEBFlIoNcEk_(ntchcrleDaedvIFduxn.cx()A,l lgRreoduupc(eg_rRoIuNpG)_,S I M| P ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~L E _| P tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_r od_f64, ncc l668F | u n c A lsltReepdSuiczee,( sFtuenpcSPirzoed_, =d=o u0b l?e ,n cNcClCSLh_mAeLmG.Oc_oRmImN.Gb,u fNfCSCiLz_ePsR[ONTCOC_LS_IPMRPOLTEO)_ S I| M^P LE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(thre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); 667| | ^ tid(tid), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cppn:t7h:r1e:a dnote: sin instantiation of member function 'RunWork, 0, 2, 4>::run' requested here( nthre 7 | DEFINE_ncacdlsD)e,v FtuindcI(nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdAx.x)l,l Rgerdouucpe(_gTrRoEuEp_)S,I M P| L ^~~~~~~~~~~E _PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); u| ^ nWorkElement, 0, 2, 2>::run' requested hered Op, Algo, Prot o7, | DCEOFLLI_NUEN_RnOcLcL>l(D)e.vrFuunn(cw(eA)l;lR e d| ^u ce_TREE_SIMPLE_S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cppu:m7_:f16:4 ,note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested heren cclFuncAllRedu c7e | ,D EFFuInNcES_unmc,c ldDoeuvbFluen,c (NAClCLl_RAeLdGuOc_eT_RTEREE,E _NSCICMLP_LPER_OSTuOm__SfI1M6P,L En)c c l| F^u ncAllRedu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hc:e,406 :F52u:n cnote: Sexpanded from macro 'DEFINE_ncclDevFunc'u m, half, N406C | C L _ AL GROu_nTWRoErEk,< cNoClClL,_ PtRyO,T Or_eSdIoMpP , | a^l go, pr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hot:o406:,52 :2 >(note: )expanded from macro 'DEFINE_ncclDevFunc'. run(&nccl S406h | m e m . wRournkW)o;r k\< c o| l ^l , ty, red/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ho:p667<:t15y:> ,note: field 'nthreads' will be initialized after field 'tidInBlock'a lgo, proto, 6672> | ( ) . r utni(d&(ntcicdlS)h,m enmt.hwroerakd)s;( n\t h r| e ^a ds), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hI:n667B:l15o:c knote: (field 'nthreads' will be initialized after field 'tidInBlock't hreadIdx.x) ,667 | g r o u pt(igdr(otuipd)), , | n ^~~~~~~~~~~~~~~~~t hread/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hs:(667n:t60h:r enote: afield 'group' will be initialized after field 'stepSize'd s), tidInB l667o | c k ( t htrieda(dtIiddx).,x )n,t hgrreoaudps((gnrtohurpe),a d s| ) ^~~~~~~~~~~~~~~~~, tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hI:n667B:l60o:c knote: (field 'group' will be initialized after field 'stepSize't hreadIdx.x )667, | g r o utpi(dg(rtoiudp)),, n t| h ^~~~~~~~~~~r eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_u64, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f64, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ oup(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size =unWork, algo, args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, 0, 2, 4>::run' requested here 203 | ric, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), In file included from nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpph:r2e: aIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hs:(10n: tIn file included from h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hr:e167a: d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hs:)667,: 15t:i dIwarning: ninitializer order does not match the declaration order [-Wreorder-ctor]B lock(threadIdx.x), 667g | r o u p (tgirdo(utpi)d,) , | n ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~th r e| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_d s(nthreads), t668i | d I n B lsotcekp(Stihzree(asdtIedpxS.ixz)e,_ g=r=o u0p (?g rnocucpl)S,h m e| m ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~. c o| m tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_m .buffSizes[NC C668L | _ P R O sTtOe_pSSIiMzPeL(Es]t/eNpCSCizLe__S T=E=P S0/ s?i zneccolfS(hTm)e m:. csotmemp.Sbiuzfef_S)i z{e s [| N ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~C C L| _ group(groupP ROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hst:e252p:S90i:z enote: _in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 252 | Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here anAsymmetri c252< | N C C L _ M APXr_iDmEiVt_iAvReIsT1d,: O In file included from p//builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h,:* 17DF: iaIn file included from rn/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.heA:cs11ty: m=In file included from m*/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.he/:t012r,: i In file included from cP/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h: X In file included from _p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hDr:Ei37Vm_: sAIn file included from R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hI: T14| Y: ^,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h :146>:,13 :/ *warning: Dunused function 'log2i' [-Wunused-function]i rect=*/0,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h : P56546r: | o5st:to a,note: t iin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herec0 > l opnrgi mlso g 2| i ^(565 l | o n g nr)u n{T r e| e ^~~~~U pDo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hw:n565<:T5,: note: Rin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested heree dOp, Proto 565S | i m p l erO,L LC>O,L LC_OULNLR_OULNLR>O(LaLr>g(sa)r;gs ) ;| ^ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h::203203::6666:: note: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested herein instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203203 | | RRuunnWWoorrkkEElleemmeenntt<>(())..rruunn((wwee));; | | ^ ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp::77::11:: note: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested herein instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 77 | | DDEFEIFNIEN_En_cncclcDleDveFvuFnucn(cA(lAllRleRdeudcuec_eT_RTEREE_ES_ISMIMPLE_Sum_f8P,L En_cSculmF_ufn8c,A lnlcRceldFuucnec,A lFluRnecdSucuem,, FrucncclS_ufml,o artc8c,l _NfClCoLa_tA8L,G ON_CTCRLE_EA,L GNOC_CTLR_EPER,O TNOC_CSLI_MPPRLOET)O _ S| I^M PLE) | ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :406:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | Run W406o | r k < c oRluln,W otryk,< croeldlo,p r,e daolpgp,r oatlo,g o2,> (p)r.ortuon,( &2n>c(c)l.Srhumne(m&.nwcocrlkS)h;m e\m . w| o ^r k); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | ti d667 | ( t i d )t,i dn(tthirde)a,d sn(tnhtrheraedasd(sn)t,h rteiaddIsn)B,l otcikd(ItnhBrleoacdkI(dtxh.rxe)a,d Igdrxo.uxp)(,g rgoruopu)p,( g r| o ^~~~~~~~~~~~~~~~~u p), | ^~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :667:60: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hnote: :field 'group' will be initialized after field 'stepSize'667 :60: note: field 'group' will be initialized after field 'stepSize' 667 | t i667d | ( t i d) ,t indt(htrieda)d,s (nntthhrreeaaddss(nt)h,r etaiddsI)n,B ltoicdkI(ntBhlroeackd(Ithdrxe.axd)I,d xg.rxo)u,p (ggroruopu(grpo)u,p ), | ^~~~~~~~~~~| ^~~~~~~~~~~ DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ?/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == ncclShmem.comm.buffSize0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(thresad[INdx.x), grouCpC(Lg_rPoRuOpT)O,_ S I| M ^~~~~~~~~~~P LE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ nthreads), tidInBlock(threadIdx.x), group(group), | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tiIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ (tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives,, n/t*hDrieraedcst(=n*t/h0r, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hInBl:o667c:k15(:t hrwarning: einitializer order does not match the declaration order [-Wreorder-ctor]a dIdx.x), group(group) ,667 | | ^~~~~~~~~~~~~~~~~ tid(t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hi:d667):,60 :n tnote: hfield 'group' will be initialized after field 'stepSize'r eads(nthre a667d | s ) , ttiiddI(ntBildo)c,k (ntthhrreeaaddIsd(xnt.hxr)e,a dgsr)o,u pt(igdrIonuBpl)o,c k (| t ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~h r e| a tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_d Idx.x), 668 | stepSiz eg(rsotuepp(Sgirzoeu_p )=,= 0| ^~~~~~~~~~~? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDeoawdsn)<,T ,t iRdeIdnOBpl, oPcrko(ttohSriemapdlIed),, CO L| L ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~_ U N| R tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_O LL>(args); | ^668 | stepSize/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h(:s203t:e66p:S inote: zin instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested heree _ == 0 ? n203c | c l S h m e m .RcuonmWmo.rbkuEflfeSmieznets<[FNnC,C LT_,P RROeTdOOp_,S IAMlPgLoE,] /PrNoCtCoL,_ SCTOELPLS_/UsNiRzOeLoLf>((T)). r:u ns(tweepS)i;z e _| ) ^ { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 7 | DEFINE_ncc l301D | e v F u n c (PArlilmRietdiuvcees_,, r/c*cDli_rfelcota=t*8/,0 ,N CPCrLo_tAoL,G O0_>T RpErEi,m sN C C| L ^_ PROTO_SIMPL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hE:)565 : 5| :^ note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406: 52565: | note: expanded from macro 'DEFINE_ncclDevFunc' runTreeU p406D | o w n < TR,u nRWeodrOkp<,c oPlrlo,t otSyi,m prleed ,C OaLlLg_oU,N RpOrLoLt>o,, C2O>L(L)_.UrNuRnO(L&Ln>c(calrSghsm)e;m . w| o ^r k); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h :note: 667in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here: 15: note: field 'nthreads' will be initialized after field 'tidInBlock' 203 | 667 | R u n Wtoirdk(Etliemde)n,t x(.)x.)r,u ng(rwoeu)p;( g r| o ^u p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h7::6671::60 :note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested herenote: field 'group' will be initialized after field 'stepSize' 7667 | | D E F I NtEi_dn(ctcildD)e,v Fnutnhcr(eAaldlsRe(dnutcher_eTaRdEsE)_,S ItMiPdLIEn_BSluomc_kf1(6t,h rnecacdlIFduxn.cxA)l,l Rgerdouucpe(,g rFouunpc)S,u m ,| ^~~~~~~~~~~h alf, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown< note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ oll, ty, redop, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ nBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ .buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ , grou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f32, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: (tidinitializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h,: 1260: ,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.hP:r14o: tIn file included from o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h,: 370: >In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hp:r14i: m/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hs: 46 :| 13 ^: warning: unused function 'log2i' [-Wunused-function] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558: 546: | note: stin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested herea tic lon g558 | l o g 2 ir(ulong n) { | ^~~~~ nRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | Ru17 warnings generated when compiling for host. nWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from | ^~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp :1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlocIn file included from k/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ (threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElementcount; | ^~~~ Algo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ PLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ :406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:12:1/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h: :note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here667 :15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 12 | DEFINE_nc c667l | D e v F utnicd((AtlilRde)d,u cnet_hRrIeNaGd_sS(InMtPhLrE_ePardosd)_,f 8t,i dnIcncBllFoucnkc(AtlhlrReeadduIcdex,. xF)u,n cgPrrooudp, (rgcrcolu_pf)l,o a t| 8 ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, N| C tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_C L_ALGO_RING, 668N | C C L _ PsRtOeTpOS_iSzIeM(PsLtEe)p S i| z^e _ == 0 ? /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:c409c:l52S:h mnote: emexpanded from macro 'DEFINE_ncclDevFunc'. comm.buff S409i | z e s [ NRCuCnLW_oPrRkOP,S /asligzoe,of (pTr)o t:o, s t4e>p(S)i.zreu_n)( &{n c c| l ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~S h m| e group(groupm .work); \ | ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :252:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock'252 | Prim i667t | i v e s x,. x/)*,D igrreocutp=(*g/r0o,u pP)r,o t | o ^~~~~~~~~~~~~~~~~, 0> pr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hi:m667s: 60 :| ^note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :667565 | :5 : note: tin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested herei d(tid), nt h565r | ea d s (rnutnhTrreeaedUsp)Do,w nt| , ^~~~~~~~~~~ COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66NROLL>,: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPIn file included from LE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp): 2| : ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h :33:19: warning: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hunused variable 'size' [-Wunused-variable]: 409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 33 | 409 | c o nRsutn Wsosrikzy>c,o uanltg;o , | p ^~~~r oto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hh:r667e:a15d:I dwarning: xinitializer order does not match the declaration order [-Wreorder-ctor]. x), group(group), 667 | | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | t tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_i d(tid), nthrea ds668( | n t h r esatdesp)S,i ztei(dsItneBplSoiczke(_t h=r=e a0d I?d xn.cxc)l,S hgmreomu.pc(ogmrmo.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_f16, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hck:(222t:h19r:e adwarning: Iunused variable 'size' [-Wunused-variable]d x.x), grou p222( | g r o u pc)o,n s t| ^~~~~~~~~~~s size_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h: 370409: | 19 : warning: unused variable 'size' [-Wunused-variable]R unWorks,s iazleg_ot, spirzoet o=, a4r>g(s)-.>rcuonu(n&tn;c c l| S ^~~~h mem.wor/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hk:)371;: 15\: warning: | unused variable 'bid' [-Wunused-variable] ^ 371 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h : 667 : 15c:o nnote: sfield 'nthreads' will be initialized after field 'tidInBlock't int bid = g667r | i d O f ftsiedt( t/i dc)h,a nnntehlrCeoaudnst(;n t h| ^~~r eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h_S:u667m:_15u:3 2warning: ,initializer order does not match the declaration order [-Wreorder-ctor] ncclFuncAllReduc e667, | F u n ctSiudm(,t iudi)n,t 3n2t_htr,e aNdCsC(Ln_tAhLrGeOa_dTsR)E,E ,t iNdCICnLB_lPoRcOkT(Ot_hSrIeMaPdLIEd)x . x| )^, group(g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hr:o409u:p52):, note: expanded from macro 'DEFINE_ncclDevFunc'| ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 409 | Ru n668W | o r k < csotlelp,S itzye,( srteedpoSpi ,= =a l0g o?, npcrcoltSoh,m e4m>.(c)o.mrmu.nb(u&fnfcScilzSehsm[eNmC.CwLo_rPkR)O;T O\_ S I| M ^P LE]/NCCL_S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hT:E667P:S15/:s inote: zfield 'nthreads' will be initialized after field 'tidInBlock'e of(T) : ste p667S | i z e _ )t i{d ( t| i ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~d ) ,| group(groupn threads(nthreads), t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hi:d301I:n90B:l onote: cin instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested herek (threadIdx.x )301, | g r o u p (Pgrriomuipt)i,v e s| < ^~~~~~~~~~~~~~~~~T , RedOp/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h,: 667F:a60n:A snote: yfield 'group' will be initialized after field 'stepSize'm metric<1, N C667C | L _ M A Xt_iDdE(Vt_iAdR)I,T Yn>t,h r/e*aDdisr(enctth=r*e/a0d,s )P,r ottiod,I n0B>l opcrki(mtsh r e| a ^d Idx.x), gro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hu:p565(:g5r:o unote: pin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here) , | ^~~~~~~~~~~ 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.woIn file included from rk)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp;: 2\: In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h ^: 10/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h: In file included from :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h667::168/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h: 15::667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h ::15warning: 140:initializer order does not match the declaration order [-Wreorder-ctor]: 14note: :field 'nthreads' will be initialized after field 'tidInBlock' warning: unused variable 'data1' [-Wunused-variable] 667 | 667 | t140 i | d ( tt ii ddu()it,ni tdn3)t2,h_ rtne tadhdasrte(ana1dt,sh (rfneltaahdgrs1e),a, d dsta)it,da I2tn,i BdfIllnoBaclgko2(c;tk h( rt| eh ^~~~~ar deIaddxI.dxx)./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h,x: )140g,:r21 o:gu prwarning: o(uunused variable 'flag1' [-Wunused-variable]gp r(ogurpo)u,p ) ,140| | ^~~~~~~~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ u| /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hi tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_:n 667t:3602:_ tnote: field 'group' will be initialized after field 'stepSize'd at a6681 | , f l as gt6671e | ,p S di az tetai(2ds,(t tefipldSa)ig,z 2en;_t h =r| =e ^~~~~ a 0d s?( nntch/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hcr:le140Sa:h28dm:se )mwarning: ,.unused variable 'data2' [-Wunused-variable] c toimdmI.nbBu lf140of | cS ki (z te hsur[ieNnaCtdC3IL2d__xPt.R xdO)aT,tO a_g1Sr,Io MufPplL(aEgg]r1/o,Nu CpdC)aL,t_ aS 2T| ,E ^~~~~~~~~~~P Sf/lsaigz2e;o f (| T ^~~~~) : step/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hS:i140z:e_35): {warning: unused variable 'flag2' [-Wunused-variable] | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 140 | uint32_t d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.ha:t62a:156,: fnote: lin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested herea g1, dat a622 | , f l aPgr2i;m i t| i ^~~~~v es, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIIn file included from MPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f32, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:t2: iIn file included from d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h(:t10i: dIn file included from )/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h,: 168n: th/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hr:e140a:d14s:(n twarning: hunused variable 'data1' [-Wunused-variable]r eads), tidIn B140l | o c k ( tuhrienatd3I2d_xt. xd)a,t ag1ro,u pf(lgargo1u,p )d,a t a| 2 ^~~~~~~~~~~~~~~~~, flag2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h;: 667 :| 60 ^~~~~: note: field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21 :667 | warning: unused variable 'flag1' [-Wunused-variable] tid(t i140d | ) , n tuhirneta3d2s_(tn tdharteaa1d,s )f,l atgid1I,n Bdlaotcak2(,t hfrleaagd2I;d x. x| ) ^~~~~, grou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hp:(140g:ro28u:p )warning: ,unused variable 'data2' [-Wunused-variable] | ^~~~~~~~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static lon/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hg :lo667g:215i:( lwarning: oinitializer order does not match the declaration order [-Wreorder-ctor]n g n) { | ^~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nIn file included from threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | Ru/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nW17 warnings generated when compiling for host. ork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? nc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ clShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h::17: 222In file included from :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h19::11 : warning: In file included from unused variable 'size' [-Wunused-variable]/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h : 222 | const ssize_t size = args->count; | ^~~~ 12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) {In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_bf8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66 /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 558 | run/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: 17 warnings generated when compiling for host. warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, ProIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ to, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gro17u warnings generated when compiling for host. p(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ proto, 2>().run(&ncclShmem.wo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rk); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: 17 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f16, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: 409warning: | initializer order does not match the declaration order [-Wreorder-ctor] RunWorkd,( taildg)o,, nptrhorteoa,d s4(>n(t)h.rreuand(s&)n,c ctliSdhImneBml.owcokr(kt)h;r e\a d I| d ^x .x), grou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hp:(667g:r15o:u pnote: )field 'nthreads' will be initialized after field 'tidInBlock', | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 667 | tid( t668i | d ) , nsttherpeSaidzse((nsttherpeSaidzse)_, =t=i d0I n?B lnoccckl(Sthhmreema.dcIodmxm..xb)u,f fgSirzoeusp[(NgCrCoLu_pP)R,O T O| _ ^~~~~~~~~~~~~~~~~S IMPLE]//builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hN:C667C:L60_:S Tnote: Efield 'group' will be initialized after field 'stepSize'P S/sizeof(T) 667 | : s t etpiSdi(ztei_d)) ,{ n t| h ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~r e a| d group(groups (nthreads), tidInB/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hlo:c301k:(90t:h rnote: ein instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herea dIdx.x), gr o301u | p ( g r o u pP)r,i m i| t ^~~~~~~~~~~i ves, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : warning: unused function 'log2i' [-Wunused-function]In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ hreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f16.cpp:117 warnings generated when compiling for host. : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ).run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFu:28: warning: unused variable 'data2' [-Wunused-variable] nc(AllReduce_TREE_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ E_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u64, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) :, | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_f32, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h| ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~: 667 :| 15 group(group: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h | : 252 : 90 :t inote: din instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here( tid), nth r252e | a d s ( n t hPrreiamdist)i,v etsi , /*Direct=* /6680 | , P r osttoe,p S0i>z ep(rsitmesp S i| z ^e _ == 0 ? nccl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.hS:h565m:e5m:. cnote: oin instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested herem m.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUp 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduceD_ToRwEnE<_TS,I MRPeLdEO_pS,u mP_ru8o,t onScicmlpFluenu,m ,C OuLiLn_tU8N_RtO,L LN>C(CaLr_gALsG)O;_ T R| E ^E , NCCL_PROTO_S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hI:M203P:L66E:) note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here| ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h: 406203: | 52 : note: expanded from macro 'DEFINE_ncclDevFunc' RunWo r406k | E l e m eRnutnt,o ,a lCgOoL,L _pUrNoRtOoL,L >2(>)(.)r.urnu(nw(e&)n;c c l| S ^h mem.work); \ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp :| 7 ^: 1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hfield 'nthreads' will be initialized after field 'tidInBlock' :7667 | :D15E:F I667warning: N | Einitializer order does not match the declaration order [-Wreorder-ctor] _ n c ctliDde(vtFiudn)c,( AnltlhRreed ua667cd | es _( Tn Rt EhtEri_edSa(IdtMsP)iL,dE )_,tSi udnImtn_hBurl3eo2ac,dk s(n(tcnhctrlheFraeudanIdcdsAx)l.,lx R)te,idd uIgcnreBo,lu opF(cugknr(cotSuhuprm)e,,a du I| id ^~~~~~~~~~~~~~~~~nx t.3x2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h)_:,t667 ,:g 60rN:oC uCnote: pLfield 'group' will be initialized after field 'stepSize'(_ gArLoGuOp_)T,R E E| 667, ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | N | C tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ C tLi_dP(RtOiTdO)_,S InM tP668hL | rE e )a d ss (t| ne^tp Shirzeea(dsst/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h)e:p,409S :it52zi:ed _Inote: n=Bexpanded from macro 'DEFINE_ncclDevFunc'=l o0c k?( tnhcrc el409aS | dh Im de xm ..Rxcu)on,mW omgr.rkbo_,S IaMlPgLoE,] /pNrCoCtLo_,S T4E>P(S)/.sriuzne(o&fn(cTc)l S:h msteemp.Swiozrek_)); {\ | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ ^ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here667 | tid (62t | i d ) , Pnrtihmrietaidvse(sna,d I0d,x .Pxr)o,t og,r o0u>p (pgrriomusp ) ,| ^ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h::558667::560:: note: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested herefield 'group' will be initialized after field 'stepSize' 558 | 667 | r u nR i ntgit(iadrgIsn)B;l o c| k ^( threadIdx.x),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :g203r:o66u:p (note: gin instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested herer oup), | ^~~~~~~~~~~ 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDowncount; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWork Algo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Element().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h.x:)222,: 19g:r owarning: uunused variable 'size' [-Wunused-variable]p (group), 222| | ^~~~~~~~~~~ const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_f64, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp :7 | 2: DIn file included from E/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.hF:I13N: E_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.hn:c76c:l18D:e vwarning: Funused variable 'y' [-Wunused-variable]u nc(AllReduce_T R76E | E _ S I M P L E _uSinutm3P2o_stt Dyi, vh_eua6d,4 ,m annctcilsFsuan;c A l| l ^R educe, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | 140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | u stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threiadIdx.x), group(group), | ^~~~~~~~~~~ nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, datIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ a2, flag2; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLIn file included from E]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ 2 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:222:19: warning: unused variable 'size' [-Wunused-variable] 222 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:370:19: warning: unused variable 'size' [-Wunused-variable] 370 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:371:15: warning: unused variable 'bid' [-Wunused-variable] 371 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou1p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthrkElement, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupro(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ to, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ id), nthrea/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hds(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), runTreeUpDown, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u32, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ProtoSimple<1, 1, COLL_UNROLL>, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hs:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | PrimitivesC,L _0A,L GPOr_oRtIoN,G ,0 >N CpCrLi_mPsR O T| O ^_ SIMPLE) /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h| :^80 :5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406: 5280: | note: expanded from macro 'DEFINE_ncclDevFunc' runRingo(pa),; a l| g ^o , proto, 2/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h>:(203):.66r:u nnote: (in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here& ncclShme m203. | w o r k ) ; \ Ru n| W ^o rkElemen/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ht:<667F:n15,: Tnote: ,field 'nthreads' will be initialized after field 'tidInBlock' RedOp, A l667g | o , P rtoitdo(t,i dC)O,L Ln_tUhNrReOaLdLs>((n)t.hrurne(awdes));, t| i ^d InBlock(th/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cppr:e3a:d1I: dnote: xin instantiation of member function 'RunWork, 1, 2, 4>::run' requested here. x), group(g r3o | uDpE)F,I N E| ^~~~~~~~~~~~~~~~~_ ncclDe/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hv:F667u:n60c:( Anote: lfield 'group' will be initialized after field 'stepSize'l ToAllPiv o667t | _ R I N Gt_iSdI(MtPiLdE)_,S unmt_hir8e,a dnsc(cnltFhurneacdAsl)l,T otAildlIPniBvlootc,k (FtuhnrceSaudmI,d xi.nxt)8,_ tg,r oNuCpC(Lg_rAoLuGpO)_,RI N G| , ^~~~~~~~~~~ NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(thIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ readIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x17 warnings generated when compiling for host. ), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); 9 warnings generated when compiling for host. | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 1 warning generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]//builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthrL>eads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDivIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ , int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nt/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), gr 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | o tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_up(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 68%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ Size_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 2 warnings generated when compiling for gfx1100. 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(groIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ up), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ >, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PRO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 667 | 62t | i d ( t iPdr)i,m intthirveeasdh,r e0adIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ TO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ , Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_u8, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nth/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ reads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \17 warnings generated when compiling for host. | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement:(18):. ruwarning: nunused variable 'y' [-Wunused-variable]( we); | ^ 76 | ui/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cppn:t123:21_:t note: yin instantiation of member function 'RunWork, 1, 2, 2>::run' requested here, head, mantis s12a | ;D E F| I ^N E_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 2>, 2>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCC/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(ti17 warnings generated when compiling for host. d), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclSh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:252:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 252 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) :In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 17 warnings generated when compiling for host. | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:301:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 301 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:565:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1, 4>, 4>' requested here 565 | runTreeUpDown, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 0, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/siIn file included from zeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:62:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 62 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/all_reduce.h:558:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 558 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_i8, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/alltoall_pivot_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 1 warning generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:58:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 58 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/broadcast.h:95:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 95 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_i8, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/broadcast_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 1 warning generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | sIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ tepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threa/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hdIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_In file included from ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ :1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 69%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp 9 warnings generated when compiling for gfx1100. [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp 17 warnings generated when compiling for gfx1100. [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. [ 70%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp 17 warnings generated when compiling for gfx1100. [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o 17 warnings generated when compiling for gfx1100. /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp 17 warnings generated when compiling for gfx1100. [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 71%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp 17 warnings generated when compiling for gfx1100. [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y,/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. [ 72%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 73%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp :167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o 9 warnings generated when compiling for host. /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.bIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ uffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 17 warnings generated when compiling for gfx1100. [ 74%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp 17 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: 17 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp [ 75%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 17 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ tepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 76%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t dIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ata1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ o, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIIn file included from ZE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp):, 1 : | In file included from ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h : 12| : warp(tid/WARP_SIZE In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h: 76506: | 18 : warning: funused variable 'y' [-Wunused-variable]l agThread((ti d76% | 4 ) = u=int32_t y, head, mantissa; | ^ 3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | m17 warnings generated when compiling for gfx1100. scclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, In file included from flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, In file included from head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto,13 : 0In file included from >/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h p:r168i: m/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hs: 140 :| 14 ^: warning: unused variable 'data1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here140 | ui n3t | 3M2S_CtC Ld_aItMaP1L,_ KfElRaNgE1L,_ EdNaTtRa2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ Y_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 77%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ _t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreterIn file included from , ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ )) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | PrimiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:ti1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ves, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, woIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ rk); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | ui17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ nt32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cppIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreaIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIds), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ dx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ : note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInte9 warnings generated when compiling for host. rpreterIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ , ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group 17 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. : note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 9 warnings generated when compiling for host. 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128OIn file included from ffset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 78%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(ste9 warnings generated when compiling for gfx1100. pSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ rpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_MinMax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp :14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f64.cpp:1: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ reads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ 9 warnings generated when compiling for gfx1100. | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ :506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL[ 79%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o 128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives , 1, Proto, 0140> | p r i musi n t| 3 ^2 _t data1, fl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cppa:g31:,1 :da tnote: ain instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here2 , flag 23; | M S| C ^~~~~C L_IMPL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h_:K140E:R21N:E Lwarning: _unused variable 'flag1' [-Wunused-variable]E NTRY_FU N140C | _ D E V RuEiDnOt3P2__TtY PdEa(tSau1m,, frlcacgl1_b,f ldoaatta82,, ffallasge2);; | | ^~~~~^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h::28405:: 3warning: :unused variable 'data2' [-Wunused-variable] note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 140 | 405 | u i nmts3c2c_ltR udantIan1t,e rfplraegt1e,r :,35 :P rwarning: ounused variable 'flag2' [-Wunused-variable]t oLL128, f140u | l l O p su>i(ncto3m2m_,t adlagtoa,1 ,w ofrlka)g;1 ,\ d a| t ^a 2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threa/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ dIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:609 warnings generated when compiling for gfx1100. : note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid),In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~ [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreaIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ds), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h::1220: :In file included from 57/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:: 13note: : In file included from in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h :168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14 :220 | warning: unused variable 'data1' [-Wunused-variable] Primitives< T140, | R e d Oupi,n tF32a_ntA sdyamtmae1t,r ifcl ,d a1t,a 2P,r oftloa,g 20;> p| r ^~~~~i ms | ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h :140:21: warning: unused variable 'flag1' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp :1403 | : 1 : unote: iin instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested heren t32_t dat a31 | ,M SfClCaLg_1I,M PdLa_tKaE2R,N EfLl_aEgN2T;R Y _| F ^~~~~U NC_DEV/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hR:E140D:O28P:_ Twarning: Yunused variable 'data2' [-Wunused-variable]P E(Prod, 140i | n t 8 _ tu,i nfta3l2s_et) ;d at a| 1^, flag1, d/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.ha:t405a:2,3 :f lnote: aexpanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE'g 2; | ^~~~~ 405/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h | : 140 :m35s:c cwarning: lunused variable 'flag2' [-Wunused-variable]R unInterp r140e | t e r < tuyinpte3,2 _Ftu ndca#t#ad1e,v rfeldaogp1<,t ydpaet>a,2 ,P rfoltaogL2L;1 2 8| , ^~~~~ fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | s[ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp tatic long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.bu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ ffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRIn file included from Y_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ :168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ [ 80%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : step9 warnings generated when compiling for host. Size_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grIn file included from o/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof9 warnings generated when compiling for gfx1100. (T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408In file included from :3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, f9 warnings generated when compiling for gfx1100. lag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.huint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ [ 81%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o | warp(tid/WARP_SIZE 506 | flagThread((tid%/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp 4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInteIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ rpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:39 warnings generated when compiling for host. : note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | p17r warnings generated when compiling for gfx1100. ims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)In file included from , | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_bf16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grouIn file included from p), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(steIn file included from pSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint329 warnings generated when compiling for gfx1100. _t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76[ 82%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o | uint32_t y, head, mantissa; | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: 9 warnings generated when compiling for gfx1100. note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMaIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ x_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBloc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f16, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ k(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168[ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->reIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ dOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 83%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring-In file included from >next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PIn file included from R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ OTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable]epSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->pre 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ v, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMi[ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o nMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthrea9ds warning(nst generatedh when compiling for rgfx1100e. ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Size_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthread/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f32, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem./builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:506:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 504 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 505 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 506 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 507 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:220:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 220 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:3:1: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:408:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 408 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threa[ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o dIdx.x), group(group), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Mi9nM warningasx generated_ when compiling for ugfx11006. 4, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prIn file included from i/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ms(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 84%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/msccl_kernel_Sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:14/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads[ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o (nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp : 2 : rIn file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.hn:R10i: nIn file included from g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h<:T167,: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hR:e667d:O15p:, warning: Pinitializer order does not match the declaration order [-Wreorder-ctor]r oto, CO 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ LL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RINIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ G_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(In file included from st/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cppe:p1S: iIn file included from z/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.he:_17 : =In file included from =/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h :011 : ?In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.hn:12c: cIn file included from l/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hS:h126m: eIn file included from m/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h.:c14: oIn file included from m/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hm:.37b: uIn file included from f/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hf:S14i: z/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.he:46s:[13N:C Cwarning: Lunused function 'log2i' [-Wunused-function]_ PROTO_SIMP L46E | ]s/tNCaCtiL_cS TloEnPgS /lsoigz2eio(fl(onTg) n:) s{t e p| S ^~~~~ ize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u32, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().9 warnings generated when compiling for gfx1100. run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h[ 85%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o :63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_f64, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ : note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.workL_STEPS/); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, argIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/s->connIndex); sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u8, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flalock(threadIdgx1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ .x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_u64, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(t9 warnings generated when compiling for gfx1100. hreadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; 9 warnings generated when compiling for host. | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthrIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128O9f warnings generated when compiling for gfx1100. fset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sIn file included from izeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group [ 86%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduIn file included from c/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthree_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreadIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | D EF I NrEu_nnRcicnlgDM(ualrSgusm)_;f 3 2| , ^ ncclFuncReduce,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :F203u:n66c:P rnote: eMin instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested hereu lSum, flo a203t | , N C C L _ A L GROu_nRWIoNrGk,E lNeCmCeLn_tP(). r406u | n ( w e )R;u n W| o ^r kin instantiation of member function 'RunWork, 1, 2, 4>::run' requested here, algo, proto ,7 | 2D>E(F)I.NrEu_nn(c&cnlcDcelvSFhumnecm(.Rweodrukc)e;_ R\I N G| _ ^S IMPLE_PreMul/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hS:u667m:_15f:1 6note: ,field 'nthreads' will be initialized after field 'tidInBlock' ncclFuncRedu c667e | , F u ntciPdr(etMiudl)S,u mn,t hhraelafd,s (NnCtChLr_eAaLdGsO)_,R ItNiGd,I nNBClCoLc_kP(RtOhTrOe_aSdIIMdPxL.Ex)) , | g^r oup(gr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ho:u409p:)52,: note: | expanded from macro 'DEFINE_ncclDevFunc' ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h: 667409: | 60 : note: field 'group' will be initialized after field 'stepSize'Ru nWork ,n tahlrgeoa,d sp(rnotthor,e a4d>s()),. rtuind(I&nnBclcolcSkh(mtehmr.ewaodrIkd)x;. x\) , | g ^r oup(grou/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hp:)667,: 15 :| ^~~~~~~~~~~note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f16, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1,issa; | ^ data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T)In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_ProIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ d_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ id(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRingIn file included from (/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.ha:r13g: s)/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h;: 76 :| 18 ^: warning: unused variable 'y' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203 :7666 | : note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here uint 32032 | _ t y , h e aRdu,n WmoarnktEilsesmae;n t <| F ^n , T, RedOp, Algo, Proto, COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ Arg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f32, ncclFuncReduce, FuncPreIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ MulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:In file included from 28: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cppwarning: :unused variable 'data2' [-Wunused-variable]2 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h140: | 169 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h : 270u:i19n:t 3warning: 2_unused variable 'ptr' [-Wunused-variable]t data1, flag 1270, | d a t a 2 , fuliangt26;4 _ t| * ^~~~~ ptr = /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hr:e140c:v35P:t rwarning: (0unused variable 'flag2' [-Wunused-variable]) +ll128O f140f | s e t ; u i| n ^~~t 32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128OffsetIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizesIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [NCCL_PROTO_SIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ IMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement()In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ .run(we); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_nIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ cclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunIn file included from Work, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); 9 warnings generated when compiling for gfx1100. | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().r9 warnings generated when compiling for host. un(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid),In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u32, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncP[ 87%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o reMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmemIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ .comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, arg/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ s->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | s[ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o tatic long log2i(long n) { | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ , flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128OffsIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ et; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o 76 | uint32_t y, head, mantissa; | ^ 140 | uint32_t data1, flag1, data2/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp , flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ L_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f16, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | In file included from uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>()[ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o .run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFuncIn file included from (R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cppe:du2c: eIn file included from _/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.hRI:N10G: _In file included from S/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hI:M167P: L/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hE:_667P:r15o:d _warning: uinitializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u8, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(6nthre4a,d sn)c,c ltFiudnIcnRBeldouccke(,t hFruenacdPIrdoxd.,x )u,i ngtr6o4u_pt(,g rNoCuCpL)_,AL G O| _ ^~~~~~~~~~~~~~~~~R ING, N/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hC:C667L:_60P:R Onote: Tfield 'group' will be initialized after field 'stepSize'O _SIMPLE) | ^667 | tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h(:t406i:d52):, note: nexpanded from macro 'DEFINE_ncclDevFunc't hreads(nth r406e | a d s ) ,R utniWdoIrnkBg,r oaulpg(og,r opurpo)t,o , | 2 ^~~~~~~~~~~> ().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edOp, Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u32, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h: uint64_t* ptr = recvPtr(0)270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ +ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f64, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ COLL_UNROLL>().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSi/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hze:_667 :=15=: 0warning: initializer order does not match the declaration order [-Wreorder-ctor]? ncclShmem.comm.b u667f | f S i z etsi[dN(CtCiLd_)P,R OnTtOh_rSeIaMdPsL(En]t/hNrCeCaLd_sS)T,E PtSi/dsIinzBeloofc(kT()t h:r esatdeIdpxS.ixz)e_, )g r{o u p| ( ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g r o| u group(groupp ), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: 668in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here | stepSize(st e33p | S i z e _ p=r=i m0 s(?t indc,c lnSthhmreema.dcosm,m .&bruifnfgS-i>zperse[vN,C C&Lr_iPnRgO-T>On_eSxItM,P LaEr]g/sN-C>Csendbuff, arLg_sS-T>ErPeSc/vsbiuzfefo,f (aTr)g s:- >srteedpOSpiAzreg_,) 0{, a| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g s -| > group(groupc onnIndex, args->/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hc:o34n:n7I:n dnote: ein instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested herex ); | ^ 34 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h : 63 : 5 :p rnote: iin instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested herem s(tid, nt63h | r e a d sr,u n&Rriinngg<-T>,p rReevd,O p&,r iPnrgo-t>on,e xCtO,L La_rgUsN-R>OsLeLn>d(baurfgfs,) ;a r g| s ^- >recvbuff, a/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hr:g203s:-66>:r enote: din instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested hereO pArg, 0, a203r | g s - > c o n n IRnundWeoxr,k Ealregmse-n>tc, ProtoSimple<2, 2, 4>, 4>' requested hereR OLL>(). r65u | n ( w e )r;u n R| i ^n g, 1, 2, 4>::run' requested hereO LL_UNROLL>(arg s7) | ;D E F| I ^N E_ncclDevFu/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:c203(:R66e:d ucnote: ein instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here_ RING_SIMP L203E | _ P r e M u l S uRmu_nuW8o,r knEclcelmFeunntcm(,) .uriunnt(8w_et),; N C| C ^L _ALGO_RING, N/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cppC:C7L:_1P:R Onote: TOin instantiation of member function 'RunWork, 1, 2, 4>::run' requested here_ SIMPLE) | ^ 7 | DEFI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hN:E409_:n52c:c lnote: Dexpanded from macro 'DEFINE_ncclDevFunc'e vFunc(Red u409c | e S c a tRtuenrW_oRrIkN,, naclcgloF,u npcRreodtuoc,e S4c>a(t)t.erru,n (F&unncccMliSnhMmaexm,. wrocrckl)_;b f\l o a| t ^8 , NCCL_A/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hL:G667O:_15R:I Nnote: Gfield 'nthreads' will be initialized after field 'tidInBlock', NCCL_PRO T667O | _ S I M PtLiEd)( t i| d^) , nthr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.he:a409d:s52(:n tnote: hexpanded from macro 'DEFINE_ncclDevFunc' reads )409, | t i d IRnuBnlWoocrkk((,g raolugpo,) ,p r o| t ^~~~~~~~~~~~~~~~~o , 4>()/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h.:r667u:n60(:& ncnote: cfield 'group' will be initialized after field 'stepSize'l Shmem.wor k667) | ; \ t| i ^d (tid), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hn:t667h:r15e:a dnote: sfield 'nthreads' will be initialized after field 'tidInBlock'( nthreads )667, | t i d ItniBdl(otcikd()t,h rnetahdrIedaxds.(xn)t,h grreoaudps()g,r otuipd)I,n B | ^~~~~~~~~~~ lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(thIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h667: | 168 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h : t140i:d14(:t iwarning: dunused variable 'data1' [-Wunused-variable]) , nthreads( n140t | hr e a dusi)n,t 3t2i_dtI ndBaltoa1c,k (ftlharge1a,d Iddaxt.ax2),, fglraogu2p;( g r| o ^~~~~u p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h : 140| : tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_21 : warning: unused variable 'flag1' [-Wunused-variable] 668 | 140 | s tueipnSti3z2e(_stt edpaStiaz1e,_ f=l=a g01 ,? dnactcal2S,h mfelma.gc2o;m m .| b ^~~~~u ffSiz/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.he:s140[:N28C:C Lwarning: _unused variable 'data2' [-Wunused-variable]P ROTO_SI M140P | L E ] / NuCiCnLt_3S2T_EtP Sd/astiaz1e,o ff(lTa)g 1:, sdtaetpaS2i,z ef_l)a g{2 ; | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~| ^~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uin/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.ht3:233_:t7 :d anote: tin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested herea 1, flag1, data 233, | f l a g 2 ;p r i| m ^~~~~s (tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ readIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx9 warnings generated when compiling for gfx1100. .x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:935: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ warnings generated when compiling for gfx1100In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ . In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_f64, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u64, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 88%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tid/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp InBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 9 warnings generated when compiling for host. 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ Ring(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_u64, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(thIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ readIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:In file included from 19/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140: warning: unused variable 'ptr' [-Wunused-variable] 270 | | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_bf8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | ti/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hd:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork,(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connInde/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f32, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ x, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSi/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? nIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x),In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | 9 warnings generated when compiling for host. runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_OLL>().run(we); RING_SIMPLE_Prod_f8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group),In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf 16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp [ 89%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_bf16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_u8, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f16, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f64, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: 9unused variable 'data1' [-Wunused-variable] warnings generated when compiling for host. 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ :140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u32, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f32, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] [ 90%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o 140 | uint32_t data1, flag1, dat/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp a2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g[ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o roup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_f8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u64, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_u8, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_In file included from 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_minmax_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp [ 91%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlockIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ (threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, aIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing>r(eadrOgpsA)r;g , | 0 ^, args->con/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hn:I203n:d66e:x ,note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested herea rgs->con n203 | I n d e x ) ; R| u ^n WorkElement, ProtoSimple<2, 2, 4>, 4>' requested hereg o, Proto ,65 | C O L L _rUuNnRROiLnLg><(T),. rRuend(Owpe,) ;P r o| t ^o , COLL_U/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cppN:R7O:L1L:> (note: ain instantiation of member function 'RunWork, 1, 2, 2>::run' requested herer gs); | ^ 7 | DEFINE/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h_:n203c:c66l:D enote: vin instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested hereF unc(Reduc e203S | c a t t e r _ R IRNuGn_WSoIrMkPELlEe_mPernetMr(e)M.urluSnu(mw,e )f;l o a| t ^, NCCL_ALGO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp_:R7I:N1G:, note: Nin instantiation of member function 'RunWork, 1, 2, 4>::run' requested hereC CL_PROTO_SIMP L7E | )D E F| I^N E_ncclD/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.he:v406F:u52n:c (note: Rexpanded from macro 'DEFINE_ncclDevFunc'e duceScat t406e | r _ R I NRGu_nSWIoMrPkLc,l FaulngcoR,e dpurcoetSoc,a t2t>e(r),. rFuunn(c&PnrcecMluSlhSmuemm,. wdoorukb)l;e ,\ N C| C ^L _ALGO_RI/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hN:G667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ , NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | sta/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tic long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t datIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ a1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h,: 140a:l14g:o , warning: punused variable 'data1' [-Wunused-variable]r oto, 2>(). r140u | n ( & n cucilnSth3m2e_mt. wdoartka)1;, \f l a| g ^1 , data2, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hf:l667a:g152:; note: field 'nthreads' will be initialized after field 'tidInBlock'| ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h: 140667: | 21 : warning: unused variable 'flag1' [-Wunused-variable]t id(tid )140, | n t h rueiandts3(2n_tth rdeaatdas1),, ftliadgI1n,B ldoactka(2t,h rfelaadgI2d;x . x| ) ^~~~~, gro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hu:p140(:g28r:o uwarning: punused variable 'data2' [-Wunused-variable]) , | ^~~~~~~~~~~~~~~~~ 140 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h : 667 :u60i:n tnote: 3field 'group' will be initialized after field 'stepSize'2 _t data1 ,667 | f l a g 1t,i dd(attiad2),, fnltahgr2e;a d s| ( ^~~~~n thre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.ha:d140s:)35,: twarning: iunused variable 'flag2' [-Wunused-variable]d InBloc k140( | t h r e audiIndtx3.2x_)t, dgartoau1p,( gfrloaugp1),, d a| t ^~~~~~~~~~~a 2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSizIn file included from e_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grou/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->reIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ringIn file included from ->/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cppn:e1x: tIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :a17r: gIn file included from s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h-:>11s: eIn file included from n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.hd:b12u: fIn file included from f/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h,: 126a: rIn file included from g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.hs:-14>: rIn file included from e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.hc:v37b: uIn file included from f/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hf:,14 : a/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hr:g46s:-13>:r edwarning: Ounused function 'log2i' [-Wunused-function]p Arg, 0, 46a | rsgtsa-t>icco nlnoInngd elxo,g 2air(glso-n>gc onnn)I n{d e x| ) ^~~~~; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ cvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork9, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ warnings generated when compiling for host. [ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groupIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ (group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_bf8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f64, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ Proto, COLL_UNROLL>(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RINIn file included from G_SIMPLE_PreMulSum_f16, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? nIn file included from cclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | step9 warnings generated when compiling for gfx1100. Size(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid([ 92%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u64, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ E_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u32, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL[ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o _ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52:/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_u8, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.xIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ ), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, floatIn file included from , NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | 9 warnings generated when compiling for gfx1100. RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f32, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] [ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.bu[ 93%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o ffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), n[ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o threads(nthreads), tidInBlock(threadIdx.x),/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/siz9 warnings generated when compiling for gfx1100. eof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here u203i | n t3 2 _ t d a tRau1n,W ofrlkaEgl1e,m ednatta<2F,n ,f lTa,g 2R;ed O p| , ^~~~~ Algo, Pro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.ht:o,140 :C21O:L Lwarning: _unused variable 'flag1' [-Wunused-variable]U NROLL>() .140r | u n ( w eu)i;n t 3| 2 ^_ t data1, flag/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp1:,7 :d1a:t anote: 2,in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here flag2; | ^~~~~ 7 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hD:E140F:I28N:E _warning: nunused variable 'data2' [-Wunused-variable]c clDevFun c140( | R e d u cueiSncta3t2t_etr _dRaItNaG1_, SfIlMaPgL1E,_ Pdraotda_2f,3 2f,l ang2c;c l F| u ^~~~~n cReduc/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.he:S140c:a35t:t ewarning: runused variable 'flag2' [-Wunused-variable], 140 | uint32_tF udnactPar1o,d ,f lfalgo1a,t ,d aNtCaC2L,_ AfLlGaOg_2R;I N G| , ^~~~~ NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ edOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), grouIn file included from p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ (group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_f8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ | ^ [ 94%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_premulsum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreadsIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ , &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f16, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:[ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o 1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f32, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlockIn file included from (threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_bf16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCC 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ L_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadId9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ x.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 9 warnings generated when compiling for host. 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group)In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. , | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f64, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInB[ 95%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o lock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u32, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t dat | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' a1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROIn file included from TO/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp_:S2I: MIn file included from P/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hL:E10): In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h| :^168 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hwarning: :unused variable 'data1' [-Wunused-variable]406 :52: note: expanded from macro 'DEFINE_ncclDevFunc' 140 | 406 | u i n t 3R2u_ntW odraktl,a ga2l;g o ,| ^~~~~p roto, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h2:>140(:)21.:r uwarning: nunused variable 'flag1' [-Wunused-variable]( &ncclSh me140m | . w o r ku)i;n t\3 2 _| t ^ data1, fl/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.ha:g6671:,15 :d anote: tfield 'nthreads' will be initialized after field 'tidInBlock'a 2, flag2; | 667 ^~~~~ | t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hi:d140(:t28i:d )warning: ,unused variable 'data2' [-Wunused-variable] nthread s140( | n t h r euaidnst)3,2 _tti ddIantBal1o,c kf(ltahgr1e,a ddIadtxa.2x,) ,f lgargo2u;p ( g| r ^~~~~o up), /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h :| 140 ^~~~~~~~~~~~~~~~~: 35: warning: unused variable 'flag2' [-Wunused-variable] /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: 140note: | field 'group' will be initialized after field 'stepSize' uint32_ t667 | d a t a 1t,i df(ltaigd1),, d anttah2r,e afdlsa(gn2t;h r e| a ^~~~~d s), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u64, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_f8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:2: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f16, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 96%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tidIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ (tid), nthreads(nthrIn file included from eads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f32, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o 46 | static long log2i(long n) { | ^~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, dat/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp a2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_bf8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, aIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ lgo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 17 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReducIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ eScatter_RING_SIMPLE_Sum_bf8, ncclFuncIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. [ 97%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid)In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantis,sa ;n t h| r ^e ads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_u8, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &In file included from ri/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cppn:g2-: >In file included from p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hr:e10v: ,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h&:r167i: n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hg:-667>:n15e:x t,warning: initializer order does not match the declaration order [-Wreorder-ctor]a rgs->sendbuff, args- >667r | e c v b utfifd,( tairdg)s,- >nrtehdrOepaAdrsg(,n t0h,r eaardgss)-,> ctoindnIInnBdlexo,c ka(rtghsr-e>acdoIndnxI.nxd)e,x )g;r o u| p ^( group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 668 | 65s | t e p S irzuen(Rsitnegpu(fafrSgisz)e;s [ N| C ^C L_PROTO_SIMPL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hE:]203/:N66C:C Lnote: _in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested hereS TEPS/size o203f | ( T ) : s t eRpuSniWzoer_k)E l{e m e| n ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~t < F| n group(group, T, RedOp, Algo, Proto, COLL_UNROLL/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h>(:)34.:r7u:n (note: win instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested heree ); | ^ 34 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp : 7 : 1p:r inote: min instantiation of member function 'RunWork, 1, 2, 2>::run' requested heres (tid, nthre a7d | sD,E F&IrNiEn_gn-c>cplrDeevv,F u&nrci(nRge-d>unceexStc,a tatregrs_-R>IsNeGn_dSbIuMfPfLE,_ Saurmg_sf-6>4r,e cnvcbculfFfu, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_prod_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h | uint32_t y, head, mantissa; | ^ :140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, dataIn file included from 2, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cppf:la1g: 2In file included from ; /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h :| 17 ^~~~~: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_f64, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex);9 warnings generated when compiling for gfx1100. | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PRIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ OTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. [ 98%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ [ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ize(stepSize_ == 0 ? ncclShmem.comm.buffSi[ 99%] Building CXX object CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/s/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o -MF CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp izeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: [ 99%] Building CXX object CMakeFiles/rccl.dir/git_version.cpp.o in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nth/usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60300 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/network/unpack -I/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -parallel-jobs=12 -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx1100 -MD -MT CMakeFiles/rccl.dir/git_version.cpp.o -MF CMakeFiles/rccl.dir/git_version.cpp.o.d -o CMakeFiles/rccl.dir/git_version.cpp.o -c /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/git_version.cpp reads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->send/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u8, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ buff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(argsIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPIn file included from os/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u8.cppt:D1i: vIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h,: 17i: nIn file included from t/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h6:411_: tIn file included from ,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h: 12N: CIn file included from C/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.hL_:A126L: GIn file included from O/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h_:R14I: NIn file included from G/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h,: 37N: CIn file included from C/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.hL:_14P: R/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.hO:T46O:_13S:I Mwarning: Punused function 'log2i' [-Wunused-function]L E) | ^ 46 | st/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ha:t409i:c52 :l onote: nexpanded from macro 'DEFINE_ncclDevFunc'g log2i(l o409n | g n ) R{u n W| o ^~~~~r k, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ ) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ zes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u64, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tidIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ ), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_u32, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), In file included from | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ roup), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | pri9m warnings generated when compiling for host. s(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 9 warnings generated when compiling for host. 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEP:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ S/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t d9 warnings generated when compiling for host. ata1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hro:up667):,15 : | warning: ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~initializer order does not match the declaration order [-Wreorder-ctor] | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | 667 | s tteipdS(itzied()s,t enptShirzeea_d s=(=n t0h r?e andcsc)l,S htmiedmI.ncBolmomc.kb(utfhfrSeiazdeIsd[x.NxC)C,L _gPrRoOuTpO(_gSrIoMuPpL)E,] / N| C ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~C L _| S tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_T EPS/sizeof (668 | T ) : sstteeppSSiizzee(_s)t e{p S i| z ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~e _| = group(group= 0 ? ncclSh/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hm:e34m:.7c:o mnote: min instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here. buffSizes[ N34C | C L _ P R O TpO_rSiImMsP(LtEi]d/,N CnCtLh_reSaTdEsP,S /&sriiznego-f>(pT)r e:v ,s &treipnSgi-z>e_n)e x{t, a| r ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~g s -| > group(groups endbuff, ar/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.hg:s34-:>7r:e cnote: vin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested hereb uff, args-> 34r | e d O p A r gp,r i0m,s (atrigds,- >nctohnrneInaddesx,, &arrignsg-->>pcorennvI,n d&erxi)n;g - >| n ^e xt, args/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h-:65>:se5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66:ndbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), groIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ up(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSizeIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ _ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ Arg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ lock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, man/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ tissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFun9 warnings generated when compiling for gfx1100. c(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rcclIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ _bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ threads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ antissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tiIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ d(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 2>, 2>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f16, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduceScatter, FuncSumPIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2, 4>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2, 4>, 4>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(gIn file included from ro/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cppu:p2): ,In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h :| 10 ^~~~~~~~~~~~~~~~~: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h::667270::6019:: note: warning: field 'group' will be initialized after field 'stepSize'unused variable 'ptr' [-Wunused-variable] 667 | 270 | t i d ( t iudi)n,t 6n4t_htr*e apdtsr( n=t hrreecavdPst)r,( 0t)i+dlIln1B2l8oOcfkf(stehtr;e a d| I ^~~d x.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1In file included from , data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grouIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128OffsetIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ; | ^~~ 9 warnings generated when compiling for host. In file included from In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid)In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ , nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOp/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ :667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ x.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElementIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ ().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_bf16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cppIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ :1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(grouIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] p), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_bf16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ WorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(ntIn file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ hreads), tidInBlock(threadIdx.x), group(group), 9 warnings generated when compiling for host. | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp668: | 2 : In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h :s10t: eIn file included from p/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.hS:i168z: e/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h(:s140t:e14p:S izwarning: eunused variable 'data1' [-Wunused-variable]_ == 0 ? n cc140l | S h m e mu.icnotm3m2._btu fdfaStiaz1e,s [fNlCaCgL1_,P RdOaTtOa_2S,I MfPlLaEg]2/;N C C| L ^~~~~_ STEPS/si/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hz:e140o:f21(:T )warning: unused variable 'flag1' [-Wunused-variable]: stepSiz e140_ | ) { u| i ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~n t 3| 2 group(group_ t data1, flag1,/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h :d33a:t7a:2 ,note: fin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested herel ag2; | ^~~~~ 33 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h : 140 : 28p:r iwarning: munused variable 'data2' [-Wunused-variable]s (tid, n t140h | r e a d su,i n&tr3i2n_gt- >dparteav1,, &frliangg1-,> ndeaxtta,2 ,a rfglsa-g>2s;e n d| b ^~~~~u ff, arg/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.hs:-140>:r35e:c vwarning: bunused variable 'flag2' [-Wunused-variable]u ff, arg s140- | > r e d OupiAnrtg3,2 _0t, daartgas1-,>c fonlnaIgn1d,e xd,a taar2g,s -f>lcaogn2n;I n| d ^~~~~e x); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hNC:C667L:_15P:R OTwarning: Oinitializer order does not match the declaration order [-Wreorder-ctor]_ SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h: 409667: | 52 : note: expanded from macro 'DEFINE_ncclDevFunc't id(tid), 409n | t h r e aRdusn(Wnotrhkrh,r eaadlIgdox,. xp)r,o tgor,o u4p>((g)r.oruupn)(,& n c| c ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~l S h| m tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_e m.work); \ 668| | ^ stepS/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hi:ze667(:s15t:e pnote: Sfield 'nthreads' will be initialized after field 'tidInBlock'i ze_ == 0 ? n667c | c l S h mteimd.(ctoimdm).,b unftfhSriezaedss[(NnCtChLr_ePaRdOsT)O,_ StIiMdPILnEB]l/oNcCkC(Lt_hSrTeEaPdSI/dsxiz.exo)f,( Tg)r o:u ps(tgerpoSuipz)e,_ ) | { ^~~~~~~~~~~~~~~~~ | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h group(group: 667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthre/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.ha:d33s:(7n:t hnote: rin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested heree ads), tidInBlo c33k | ( t h r e a dpIrdixm.sx(t)i,d ,g rnotuhpr(egardosu,p )&,r i n| g ^~~~~~~~~~~- >prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u8, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:2: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f64, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; In file included from | ^/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp :2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f32, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u64, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: In file included from field 'group' will be initialized after field 'stepSize' /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h667: | 167 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h : 667t:i15d:( twarning: iinitializer order does not match the declaration order [-Wreorder-ctor]d ), nthreads(nthrea d667s | ) , t itdiIdn(Btliodc)k,( tnhtrheraedaIddsx(.nxt)h,r egardosu)p,( gtrioduIpn)B,l o c| k ^~~~~~~~~~~( threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(R9ed warningusc generatede when compiling for _gfx1100RI. NG_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ tid(/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.ht:i409d:)52,: nnote: texpanded from macro 'DEFINE_ncclDevFunc'h reads(nth r409e | a d s ) ,R utniWdoIrnkBr,o upa(lggroou,p )p,r o t| o ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~, 4| tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_> ().run(&ncclS h668m | e m.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' ste p667S | i z e ( sttiedp(Stiizde)_, =n=t h0r e?a dnsc(cnltShhrmeeamd.sc)o,m mt.ibduIfnfBSliozceks([tNhCrCeLa_dPIRdOxT.Ox_)S,I MgPrLoEu]p/(NgCrCoLu_pS)T,E P S| / ^~~~~~~~~~~~~~~~~s izeo/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.hf:(667T:)60 :: note: sfield 'group' will be initialized after field 'stepSize't epSize_) {667 | | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ t| i group(groupd (tid), nthreads(nthreads), tid/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.hI:n33B:l7o:c k(note: tin instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested hereh readIdx.x), gro u33p | (g r o u p ) ,p r i| m ^~~~~~~~~~~s (tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS9 warnings generated when compiling for host. /sizeof(T) :In file included from s/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f32.cppt:ep1S: iIn file included from z/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.he:_17): In file included from {/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h : 11| : ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h :| 12 group(group: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h::3346::713:: note: warning: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested hereunused function 'log2i' [-Wunused-function] 33 | 46 | s t a t ipcr ilmosn(gt ildo,g 2nit(hlroenagd sn,) &{r i n| g ^~~~~- >prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), In file included from gr/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cppo:u1p: (In file included from g/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hr:o17u: pIn file included from )/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h,: 11: In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~: 12 : | In file included from tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h :126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h668: | 14 : /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h : 46s:t13e:p Swarning: iunused function 'log2i' [-Wunused-function]z e(stepSize_ 46= | =s t0a t?i cn clcolnSgh mleomg.2cio(mlmo.nbgu fnf)S i{z e s| [ ^~~~~N CCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i32, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1:9 note: warningsin instantiation of member function 'RunWork, 1, 2, 4>::run' requested here generated when compiling for host. 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ 32/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h_:t203 :d66a:t anote: 1in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here, flag1, 203d | a t a 2 , f l aRgu2n;Wo r k| ^~~~~E lement (d)a.trau1n,( wfel)a;g 1 ,| ^d ata2, flag/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp2:;7 : 1| : ^~~~~ note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 7 | DEFINE_ncc l140D | e v F u nuci(nRte3d2u_cte _dRaItNaG1_,S IfMlPaLgE1_,S udmaPtoas2t,D ifvl_aig322;, n| c ^~~~~c lFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_u32, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.xIn file included from ),/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp :g1r: oIn file included from u/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.hp:(17: gIn file included from r/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.ho:u11: pIn file included from )/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h,: 12: In file included from | /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h ^~~~~~~~~~~~~~~~~: 126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h: In file included from :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h667::37: 60In file included from :/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h :note: 14: field 'group' will be initialized after field 'stepSize'/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h :46:13: warning: unused function 'log2i' [-Wunused-function] 667 | ti d46 | (sttiadti)c, lonntgh lroega2id(sl(onngt hnr) e{a d s| ^~~~~) , tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for host. 9 warnings generated when compiling for host. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i8, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_f8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u32, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sum_f8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u32.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: 9warning: unused variable 'flag1' [-Wunused-variable] warning s generated when compiling for host. 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_i64, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 17 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u8, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 2>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 2>, 2>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 2>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_i64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:2: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1, 4>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1, 4>, 4>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:203:66: note: in instantiation of member function 'RunWorkElement, 1, 2, 4>::run' requested here 203 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_u64, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 2>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 2>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:406:52: note: expanded from macro 'DEFINE_ncclDevFunc' 406 | RunWork, algo, proto, 2>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/reduce_sumpostdiv_u64.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. 9 warnings generated when compiling for gfx1100. /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:147:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 147 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 668 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:86:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 86 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2, 4>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:3:1: note: in instantiation of member function 'RunWork, 1, 2, 4>::run' requested here 3 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_i8, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:409:52: note: expanded from macro 'DEFINE_ncclDevFunc' 409 | RunWork, algo, proto, 4>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/prims_simple.h:667:60: note: field 'group' will be initialized after field 'stepSize' 667 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ 11 warnings generated when compiling for host. In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/gensrc/sendrecv_sum_i8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 11 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 17 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. 9 warnings generated when compiling for gfx1100. [100%] Linking CXX shared library librccl.so /usr/bin/cmake -E cmake_link_script CMakeFiles/rccl.dir/link.txt --verbose=1 /usr/bin/cmake -E time /usr/bin/hipcc -fPIC -O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -parallel-jobs=8 -Xoffload-linker -mllvm=-amdgpu-kernarg-preload-count=16 -Xlinker --dependency-file=CMakeFiles/rccl.dir/link.d -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -shared -Wl,-soname,librccl.so.1 -o librccl.so.1.0 CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o CMakeFiles/rccl.dir/hipify/src/channel.cc.o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o CMakeFiles/rccl.dir/hipify/src/debug.cc.o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o CMakeFiles/rccl.dir/hipify/src/group.cc.o CMakeFiles/rccl.dir/hipify/src/init.cc.o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o CMakeFiles/rccl.dir/hipify/src/net.cc.o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o CMakeFiles/rccl.dir/hipify/src/register.cc.o CMakeFiles/rccl.dir/hipify/src/transport.cc.o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o CMakeFiles/rccl.dir/hipify/src/misc/api_trace.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o CMakeFiles/rccl.dir/hipify/gensrc/all_gather_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/all_reduce_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/alltoall_pivot_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/broadcast_sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/device_table.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/host_table.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_MinMax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/msccl_kernel_Sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_minmax_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_premulsum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_prod_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gclang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] Elapsed time (seconds): 596.611 ensrc/reduce_scatter_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_scatter_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_bf8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f16.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_f8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sum_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_i8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u32.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u64.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/reduce_sumpostdiv_u8.cpp.o CMakeFiles/rccl.dir/hipify/gensrc/sendrecv_sum_i8.cpp.o CMakeFiles/rccl.dir/git_version.cpp.o -fgpu-rdc -ldl /usr/lib64/librocm_smi64.so.1.0 /usr/lib64/libamdhip64.so.6.3.42131 --hip-link --offload-arch=gfx1100 -lpthread -lrt -ldl /usr/bin/cmake -E cmake_symlink_library librccl.so.1.0 librccl.so.1 librccl.so gmake[2]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' [100%] Built target rccl gmake[1]: Leaving directory '/builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build' /usr/bin/cmake -E cmake_progress_start /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/redhat-linux-build/CMakeFiles 0 + RPM_EC=0 ++ jobs -p + exit 0 Executing(%install): /bin/sh -e /var/tmp/rpm-tmp.JU0n2t + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + '[' /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT '!=' / ']' + rm -rf /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT ++ dirname /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT + mkdir -p /builddir/build/BUILD/rccl-6.3.0-build + mkdir /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT + CFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd rccl-rocm-6.3.0 + DESTDIR=/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT + /usr/bin/cmake --install redhat-linux-build -- Install configuration: "RelWithDebInfo" -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/librccl.so.1.0 -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/librccl.so.1 -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/librccl.so -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/include/rccl/rccl.h -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/include/rccl/nccl_net.h -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/include/rccl/amd_detail/api_trace.h -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-32tb-op.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-32tb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-64tb-op.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-ll-64tb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple-op.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/allreduce-allpairs-8n-simple_2.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-0-9kb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-190kb-512kb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-512kb-7mb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-7mb-43mb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-algorithms/alltoall-8n-9kb-190kb.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-ll128.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/rccl/msccl-unit-test-algorithms/all-reduce-ring-simple.xml -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-targets.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-targets-relwithdebinfo.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-config.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64/cmake/rccl/rccl-config-version.cmake -- Installing: /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt + echo s@/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT@@ + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.so.*.[0-9]' + sed -f br.sed + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.so.[0-9]' + sed -f br.sed + sed -f br.sed + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.so' + find /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/lib64 -name '*.cmake' + sed -f br.sed + '[' -f /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt ']' + rm /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl/LICENSE.txt + /usr/bin/find-debuginfo -j48 --strict-build-id -m -i --build-id-seed 6.3.0-1.fc42 --unique-debug-suffix -6.3.0-1.fc42.x86_64 --unique-debug-src-base rccl-6.3.0-1.fc42.x86_64 --run-dwz --dwz-low-mem-die-limit 10000000 --dwz-max-die-limit 110000000 -S debugsourcefiles.list /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0 find-debuginfo: starting Extracting debug info from 1 files DWARF-compressing 1 files dwz: ./usr/lib64/librccl.so.1.0-6.3.0-1.fc42.x86_64.debug: Unknown debugging section .debug_str_offsets sepdebugcrcfix: Updated 0 CRC32s, 1 CRC32s did match. Creating .debug symlinks for symlinks to ELF files Copying sources found by 'debugedit -l' to /usr/src/debug/rccl-6.3.0-1.fc42.x86_64 find-debuginfo: done + /usr/lib/rpm/check-buildroot + /usr/lib/rpm/redhat/brp-ldconfig + /usr/lib/rpm/brp-compress + /usr/lib/rpm/redhat/brp-strip-lto /usr/bin/strip + /usr/lib/rpm/brp-strip-static-archive /usr/bin/strip + /usr/lib/rpm/check-rpaths + /usr/lib/rpm/redhat/brp-mangle-shebangs + /usr/lib/rpm/brp-remove-la-files + env /usr/lib/rpm/redhat/brp-python-bytecompile '' 1 0 -j48 + /usr/lib/rpm/redhat/brp-python-hardlink + /usr/bin/add-determinism --brp -j48 /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT Scanned 38 directories and 313 files, processed 0 inodes, 0 modified (0 replaced + 0 rewritten), 0 unsupported format, 0 errors Reading /builddir/build/BUILD/rccl-6.3.0-build/SPECPARTS/rpm-debuginfo.specpart Processing files: rccl-6.3.0-1.fc42.x86_64 Executing(%license): /bin/sh -e /var/tmp/rpm-tmp.ZQxubX + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + cd rccl-rocm-6.3.0 + LICENSEDIR=/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/licenses/rccl + export LC_ALL=C.UTF-8 + LC_ALL=C.UTF-8 + export LICENSEDIR + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/licenses/rccl + cp -pr /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/LICENSE.txt /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/licenses/rccl + RPM_EC=0 ++ jobs -p + exit 0 Provides: librccl.so.1()(64bit) rccl = 6.3.0-1.fc42 rccl(x86-64) = 6.3.0-1.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires: ld-linux-x86-64.so.2()(64bit) ld-linux-x86-64.so.2(GLIBC_2.3)(64bit) libamdhip64.so.6()(64bit) libamdhip64.so.6(hip_4.2)(64bit) libamdhip64.so.6(hip_4.3)(64bit) libamdhip64.so.6(hip_4.5)(64bit) libamdhip64.so.6(hip_5.0)(64bit) libamdhip64.so.6(hip_5.3)(64bit) libamdhip64.so.6(hip_6.0)(64bit) libc.so.6()(64bit) libc.so.6(GLIBC_2.10)(64bit) libc.so.6(GLIBC_2.14)(64bit) libc.so.6(GLIBC_2.16)(64bit) libc.so.6(GLIBC_2.17)(64bit) libc.so.6(GLIBC_2.2.5)(64bit) libc.so.6(GLIBC_2.3)(64bit) libc.so.6(GLIBC_2.3.2)(64bit) libc.so.6(GLIBC_2.3.4)(64bit) libc.so.6(GLIBC_2.32)(64bit) libc.so.6(GLIBC_2.33)(64bit) libc.so.6(GLIBC_2.34)(64bit) libc.so.6(GLIBC_2.38)(64bit) libc.so.6(GLIBC_2.4)(64bit) libc.so.6(GLIBC_2.6)(64bit) libc.so.6(GLIBC_2.7)(64bit) libc.so.6(GLIBC_ABI_DT_RELR)(64bit) libgcc_s.so.1()(64bit) libgcc_s.so.1(GCC_12.0.0)(64bit) libgcc_s.so.1(GCC_3.0)(64bit) libm.so.6()(64bit) libm.so.6(GLIBC_2.2.5)(64bit) librocm_smi64.so.1()(64bit) libstdc++.so.6()(64bit) libstdc++.so.6(CXXABI_1.3)(64bit) libstdc++.so.6(CXXABI_1.3.7)(64bit) libstdc++.so.6(GLIBCXX_3.4)(64bit) libstdc++.so.6(GLIBCXX_3.4.11)(64bit) libstdc++.so.6(GLIBCXX_3.4.18)(64bit) libstdc++.so.6(GLIBCXX_3.4.19)(64bit) libstdc++.so.6(GLIBCXX_3.4.21)(64bit) libstdc++.so.6(GLIBCXX_3.4.22)(64bit) libstdc++.so.6(GLIBCXX_3.4.26)(64bit) libstdc++.so.6(GLIBCXX_3.4.29)(64bit) libstdc++.so.6(GLIBCXX_3.4.30)(64bit) libstdc++.so.6(GLIBCXX_3.4.32)(64bit) libstdc++.so.6(GLIBCXX_3.4.9)(64bit) Processing files: rccl-devel-6.3.0-1.fc42.x86_64 Executing(%doc): /bin/sh -e /var/tmp/rpm-tmp.al3TUh + umask 022 + cd /builddir/build/BUILD/rccl-6.3.0-build + cd rccl-rocm-6.3.0 + DOCDIR=/builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl-devel + export LC_ALL=C.UTF-8 + LC_ALL=C.UTF-8 + export DOCDIR + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl-devel + cp -pr /builddir/build/BUILD/rccl-6.3.0-build/rccl-rocm-6.3.0/README.md /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT/usr/share/doc/rccl-devel + RPM_EC=0 ++ jobs -p + exit 0 Provides: cmake(rccl) = 2.21.5 rccl-devel = 6.3.0-1.fc42 rccl-devel(x86-64) = 6.3.0-1.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Requires: cmake-filesystem(x86-64) librccl.so.1()(64bit) Processing files: rccl-data-6.3.0-1.fc42.noarch Provides: rccl-data = 6.3.0-1.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Processing files: rccl-debugsource-6.3.0-1.fc42.x86_64 Provides: rccl-debugsource = 6.3.0-1.fc42 rccl-debugsource(x86-64) = 6.3.0-1.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Processing files: rccl-debuginfo-6.3.0-1.fc42.x86_64 Provides: debuginfo(build-id) = b8c9614542e08ddf38409a90f8c3993090fb3d26 librccl.so.1.0-6.3.0-1.fc42.x86_64.debug()(64bit) rccl-debuginfo = 6.3.0-1.fc42 rccl-debuginfo(x86-64) = 6.3.0-1.fc42 Requires(rpmlib): rpmlib(CompressedFileNames) <= 3.0.4-1 rpmlib(FileDigests) <= 4.6.0-1 rpmlib(PayloadFilesHavePrefix) <= 4.0-1 Recommends: rccl-debugsource(x86-64) = 6.3.0-1.fc42 Checking for unpackaged file(s): /usr/lib/rpm/check-files /builddir/build/BUILD/rccl-6.3.0-build/BUILDROOT Wrote: /builddir/build/RPMS/rccl-devel-6.3.0-1.fc42.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-debugsource-6.3.0-1.fc42.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-debuginfo-6.3.0-1.fc42.x86_64.rpm Wrote: /builddir/build/RPMS/rccl-data-6.3.0-1.fc42.noarch.rpm Wrote: /builddir/build/RPMS/rccl-6.3.0-1.fc42.x86_64.rpm Child return code was: 0